xref: /freebsd/sys/dev/cxgbe/t4_sge.c (revision 5cdaef71a95787a1c8fb62239896307850cc73f9)
154e4ee71SNavdeep Parhar /*-
2718cf2ccSPedro F. Giffuni  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3718cf2ccSPedro F. Giffuni  *
454e4ee71SNavdeep Parhar  * Copyright (c) 2011 Chelsio Communications, Inc.
554e4ee71SNavdeep Parhar  * All rights reserved.
654e4ee71SNavdeep Parhar  * Written by: Navdeep Parhar <np@FreeBSD.org>
754e4ee71SNavdeep Parhar  *
854e4ee71SNavdeep Parhar  * Redistribution and use in source and binary forms, with or without
954e4ee71SNavdeep Parhar  * modification, are permitted provided that the following conditions
1054e4ee71SNavdeep Parhar  * are met:
1154e4ee71SNavdeep Parhar  * 1. Redistributions of source code must retain the above copyright
1254e4ee71SNavdeep Parhar  *    notice, this list of conditions and the following disclaimer.
1354e4ee71SNavdeep Parhar  * 2. Redistributions in binary form must reproduce the above copyright
1454e4ee71SNavdeep Parhar  *    notice, this list of conditions and the following disclaimer in the
1554e4ee71SNavdeep Parhar  *    documentation and/or other materials provided with the distribution.
1654e4ee71SNavdeep Parhar  *
1754e4ee71SNavdeep Parhar  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
1854e4ee71SNavdeep Parhar  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
1954e4ee71SNavdeep Parhar  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2054e4ee71SNavdeep Parhar  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
2154e4ee71SNavdeep Parhar  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2254e4ee71SNavdeep Parhar  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2354e4ee71SNavdeep Parhar  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2454e4ee71SNavdeep Parhar  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2554e4ee71SNavdeep Parhar  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2654e4ee71SNavdeep Parhar  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
2754e4ee71SNavdeep Parhar  * SUCH DAMAGE.
2854e4ee71SNavdeep Parhar  */
2954e4ee71SNavdeep Parhar 
3054e4ee71SNavdeep Parhar #include <sys/cdefs.h>
3154e4ee71SNavdeep Parhar __FBSDID("$FreeBSD$");
3254e4ee71SNavdeep Parhar 
3354e4ee71SNavdeep Parhar #include "opt_inet.h"
34a1ea9a82SNavdeep Parhar #include "opt_inet6.h"
35eff62dbaSNavdeep Parhar #include "opt_ratelimit.h"
3654e4ee71SNavdeep Parhar 
3754e4ee71SNavdeep Parhar #include <sys/types.h>
38c3322cb9SGleb Smirnoff #include <sys/eventhandler.h>
3954e4ee71SNavdeep Parhar #include <sys/mbuf.h>
4054e4ee71SNavdeep Parhar #include <sys/socket.h>
4154e4ee71SNavdeep Parhar #include <sys/kernel.h>
42ecb79ca4SNavdeep Parhar #include <sys/malloc.h>
43ecb79ca4SNavdeep Parhar #include <sys/queue.h>
4438035ed6SNavdeep Parhar #include <sys/sbuf.h>
45ecb79ca4SNavdeep Parhar #include <sys/taskqueue.h>
46480e603cSNavdeep Parhar #include <sys/time.h>
477951040fSNavdeep Parhar #include <sys/sglist.h>
4854e4ee71SNavdeep Parhar #include <sys/sysctl.h>
49733b9277SNavdeep Parhar #include <sys/smp.h>
5082eff304SNavdeep Parhar #include <sys/counter.h>
5154e4ee71SNavdeep Parhar #include <net/bpf.h>
5254e4ee71SNavdeep Parhar #include <net/ethernet.h>
5354e4ee71SNavdeep Parhar #include <net/if.h>
5454e4ee71SNavdeep Parhar #include <net/if_vlan_var.h>
5554e4ee71SNavdeep Parhar #include <netinet/in.h>
5654e4ee71SNavdeep Parhar #include <netinet/ip.h>
57a1ea9a82SNavdeep Parhar #include <netinet/ip6.h>
5854e4ee71SNavdeep Parhar #include <netinet/tcp.h>
59786099deSNavdeep Parhar #include <netinet/udp.h>
606af45170SJohn Baldwin #include <machine/in_cksum.h>
6164db8966SDimitry Andric #include <machine/md_var.h>
6238035ed6SNavdeep Parhar #include <vm/vm.h>
6338035ed6SNavdeep Parhar #include <vm/pmap.h>
64298d969cSNavdeep Parhar #ifdef DEV_NETMAP
65298d969cSNavdeep Parhar #include <machine/bus.h>
66298d969cSNavdeep Parhar #include <sys/selinfo.h>
67298d969cSNavdeep Parhar #include <net/if_var.h>
68298d969cSNavdeep Parhar #include <net/netmap.h>
69298d969cSNavdeep Parhar #include <dev/netmap/netmap_kern.h>
70298d969cSNavdeep Parhar #endif
7154e4ee71SNavdeep Parhar 
7254e4ee71SNavdeep Parhar #include "common/common.h"
7354e4ee71SNavdeep Parhar #include "common/t4_regs.h"
7454e4ee71SNavdeep Parhar #include "common/t4_regs_values.h"
7554e4ee71SNavdeep Parhar #include "common/t4_msg.h"
76671bf2b8SNavdeep Parhar #include "t4_l2t.h"
777951040fSNavdeep Parhar #include "t4_mp_ring.h"
7854e4ee71SNavdeep Parhar 
79d14b0ac1SNavdeep Parhar #ifdef T4_PKT_TIMESTAMP
80d14b0ac1SNavdeep Parhar #define RX_COPY_THRESHOLD (MINCLSIZE - 8)
81d14b0ac1SNavdeep Parhar #else
82d14b0ac1SNavdeep Parhar #define RX_COPY_THRESHOLD MINCLSIZE
83d14b0ac1SNavdeep Parhar #endif
84d14b0ac1SNavdeep Parhar 
85*5cdaef71SJohn Baldwin /* Internal mbuf flags stored in PH_loc.eight[1]. */
86*5cdaef71SJohn Baldwin #define	MC_RAW_WR		0x02
87*5cdaef71SJohn Baldwin 
889fb8886bSNavdeep Parhar /*
899fb8886bSNavdeep Parhar  * Ethernet frames are DMA'd at this byte offset into the freelist buffer.
909fb8886bSNavdeep Parhar  * 0-7 are valid values.
919fb8886bSNavdeep Parhar  */
92518bca2cSNavdeep Parhar static int fl_pktshift = 0;
939fb8886bSNavdeep Parhar TUNABLE_INT("hw.cxgbe.fl_pktshift", &fl_pktshift);
9454e4ee71SNavdeep Parhar 
959fb8886bSNavdeep Parhar /*
969fb8886bSNavdeep Parhar  * Pad ethernet payload up to this boundary.
979fb8886bSNavdeep Parhar  * -1: driver should figure out a good value.
981458bff9SNavdeep Parhar  *  0: disable padding.
991458bff9SNavdeep Parhar  *  Any power of 2 from 32 to 4096 (both inclusive) is also a valid value.
1009fb8886bSNavdeep Parhar  */
101298d969cSNavdeep Parhar int fl_pad = -1;
1029fb8886bSNavdeep Parhar TUNABLE_INT("hw.cxgbe.fl_pad", &fl_pad);
1039fb8886bSNavdeep Parhar 
1049fb8886bSNavdeep Parhar /*
1059fb8886bSNavdeep Parhar  * Status page length.
1069fb8886bSNavdeep Parhar  * -1: driver should figure out a good value.
1079fb8886bSNavdeep Parhar  *  64 or 128 are the only other valid values.
1089fb8886bSNavdeep Parhar  */
10929c229e9SJohn Baldwin static int spg_len = -1;
1109fb8886bSNavdeep Parhar TUNABLE_INT("hw.cxgbe.spg_len", &spg_len);
1119fb8886bSNavdeep Parhar 
1129fb8886bSNavdeep Parhar /*
1139fb8886bSNavdeep Parhar  * Congestion drops.
1149fb8886bSNavdeep Parhar  * -1: no congestion feedback (not recommended).
1159fb8886bSNavdeep Parhar  *  0: backpressure the channel instead of dropping packets right away.
1169fb8886bSNavdeep Parhar  *  1: no backpressure, drop packets for the congested queue immediately.
1179fb8886bSNavdeep Parhar  */
1189fb8886bSNavdeep Parhar static int cong_drop = 0;
1199fb8886bSNavdeep Parhar TUNABLE_INT("hw.cxgbe.cong_drop", &cong_drop);
12054e4ee71SNavdeep Parhar 
1211458bff9SNavdeep Parhar /*
1221458bff9SNavdeep Parhar  * Deliver multiple frames in the same free list buffer if they fit.
1231458bff9SNavdeep Parhar  * -1: let the driver decide whether to enable buffer packing or not.
1241458bff9SNavdeep Parhar  *  0: disable buffer packing.
1251458bff9SNavdeep Parhar  *  1: enable buffer packing.
1261458bff9SNavdeep Parhar  */
1271458bff9SNavdeep Parhar static int buffer_packing = -1;
1281458bff9SNavdeep Parhar TUNABLE_INT("hw.cxgbe.buffer_packing", &buffer_packing);
1291458bff9SNavdeep Parhar 
1301458bff9SNavdeep Parhar /*
1311458bff9SNavdeep Parhar  * Start next frame in a packed buffer at this boundary.
1321458bff9SNavdeep Parhar  * -1: driver should figure out a good value.
133e3207e19SNavdeep Parhar  * T4: driver will ignore this and use the same value as fl_pad above.
134e3207e19SNavdeep Parhar  * T5: 16, or a power of 2 from 64 to 4096 (both inclusive) is a valid value.
1351458bff9SNavdeep Parhar  */
1361458bff9SNavdeep Parhar static int fl_pack = -1;
1371458bff9SNavdeep Parhar TUNABLE_INT("hw.cxgbe.fl_pack", &fl_pack);
1381458bff9SNavdeep Parhar 
13938035ed6SNavdeep Parhar /*
14038035ed6SNavdeep Parhar  * Allow the driver to create mbuf(s) in a cluster allocated for rx.
14138035ed6SNavdeep Parhar  * 0: never; always allocate mbufs from the zone_mbuf UMA zone.
14238035ed6SNavdeep Parhar  * 1: ok to create mbuf(s) within a cluster if there is room.
14338035ed6SNavdeep Parhar  */
14438035ed6SNavdeep Parhar static int allow_mbufs_in_cluster = 1;
14538035ed6SNavdeep Parhar TUNABLE_INT("hw.cxgbe.allow_mbufs_in_cluster", &allow_mbufs_in_cluster);
14638035ed6SNavdeep Parhar 
14738035ed6SNavdeep Parhar /*
14838035ed6SNavdeep Parhar  * Largest rx cluster size that the driver is allowed to allocate.
14938035ed6SNavdeep Parhar  */
15038035ed6SNavdeep Parhar static int largest_rx_cluster = MJUM16BYTES;
15138035ed6SNavdeep Parhar TUNABLE_INT("hw.cxgbe.largest_rx_cluster", &largest_rx_cluster);
15238035ed6SNavdeep Parhar 
15338035ed6SNavdeep Parhar /*
15438035ed6SNavdeep Parhar  * Size of cluster allocation that's most likely to succeed.  The driver will
15538035ed6SNavdeep Parhar  * fall back to this size if it fails to allocate clusters larger than this.
15638035ed6SNavdeep Parhar  */
15738035ed6SNavdeep Parhar static int safest_rx_cluster = PAGE_SIZE;
15838035ed6SNavdeep Parhar TUNABLE_INT("hw.cxgbe.safest_rx_cluster", &safest_rx_cluster);
15938035ed6SNavdeep Parhar 
160786099deSNavdeep Parhar #ifdef RATELIMIT
161786099deSNavdeep Parhar /*
162786099deSNavdeep Parhar  * Knob to control TCP timestamp rewriting, and the granularity of the tick used
163786099deSNavdeep Parhar  * for rewriting.  -1 and 0-3 are all valid values.
164786099deSNavdeep Parhar  * -1: hardware should leave the TCP timestamps alone.
165786099deSNavdeep Parhar  * 0: 1ms
166786099deSNavdeep Parhar  * 1: 100us
167786099deSNavdeep Parhar  * 2: 10us
168786099deSNavdeep Parhar  * 3: 1us
169786099deSNavdeep Parhar  */
170786099deSNavdeep Parhar static int tsclk = -1;
171786099deSNavdeep Parhar TUNABLE_INT("hw.cxgbe.tsclk", &tsclk);
172786099deSNavdeep Parhar 
173786099deSNavdeep Parhar static int eo_max_backlog = 1024 * 1024;
174786099deSNavdeep Parhar TUNABLE_INT("hw.cxgbe.eo_max_backlog", &eo_max_backlog);
175786099deSNavdeep Parhar #endif
176786099deSNavdeep Parhar 
177d491f8caSNavdeep Parhar /*
178d491f8caSNavdeep Parhar  * The interrupt holdoff timers are multiplied by this value on T6+.
179d491f8caSNavdeep Parhar  * 1 and 3-17 (both inclusive) are legal values.
180d491f8caSNavdeep Parhar  */
181d491f8caSNavdeep Parhar static int tscale = 1;
182d491f8caSNavdeep Parhar TUNABLE_INT("hw.cxgbe.tscale", &tscale);
183d491f8caSNavdeep Parhar 
18446f48ee5SNavdeep Parhar /*
18546f48ee5SNavdeep Parhar  * Number of LRO entries in the lro_ctrl structure per rx queue.
18646f48ee5SNavdeep Parhar  */
18746f48ee5SNavdeep Parhar static int lro_entries = TCP_LRO_ENTRIES;
18846f48ee5SNavdeep Parhar TUNABLE_INT("hw.cxgbe.lro_entries", &lro_entries);
18946f48ee5SNavdeep Parhar 
19046f48ee5SNavdeep Parhar /*
19146f48ee5SNavdeep Parhar  * This enables presorting of frames before they're fed into tcp_lro_rx.
19246f48ee5SNavdeep Parhar  */
19346f48ee5SNavdeep Parhar static int lro_mbufs = 0;
19446f48ee5SNavdeep Parhar TUNABLE_INT("hw.cxgbe.lro_mbufs", &lro_mbufs);
19546f48ee5SNavdeep Parhar 
19654e4ee71SNavdeep Parhar struct txpkts {
1977951040fSNavdeep Parhar 	u_int wr_type;		/* type 0 or type 1 */
1987951040fSNavdeep Parhar 	u_int npkt;		/* # of packets in this work request */
1997951040fSNavdeep Parhar 	u_int plen;		/* total payload (sum of all packets) */
2007951040fSNavdeep Parhar 	u_int len16;		/* # of 16B pieces used by this work request */
20154e4ee71SNavdeep Parhar };
20254e4ee71SNavdeep Parhar 
20354e4ee71SNavdeep Parhar /* A packet's SGL.  This + m_pkthdr has all info needed for tx */
20454e4ee71SNavdeep Parhar struct sgl {
2057951040fSNavdeep Parhar 	struct sglist sg;
2067951040fSNavdeep Parhar 	struct sglist_seg seg[TX_SGL_SEGS];
20754e4ee71SNavdeep Parhar };
20854e4ee71SNavdeep Parhar 
209733b9277SNavdeep Parhar static int service_iq(struct sge_iq *, int);
2103098bcfcSNavdeep Parhar static int service_iq_fl(struct sge_iq *, int);
2114d6db4e0SNavdeep Parhar static struct mbuf *get_fl_payload(struct adapter *, struct sge_fl *, uint32_t);
212733b9277SNavdeep Parhar static int t4_eth_rx(struct sge_iq *, const struct rss_header *, struct mbuf *);
213b2daa9a9SNavdeep Parhar static inline void init_iq(struct sge_iq *, struct adapter *, int, int, int);
214e3207e19SNavdeep Parhar static inline void init_fl(struct adapter *, struct sge_fl *, int, int, char *);
21590e7434aSNavdeep Parhar static inline void init_eq(struct adapter *, struct sge_eq *, int, int, uint8_t,
21690e7434aSNavdeep Parhar     uint16_t, char *);
21754e4ee71SNavdeep Parhar static int alloc_ring(struct adapter *, size_t, bus_dma_tag_t *, bus_dmamap_t *,
21854e4ee71SNavdeep Parhar     bus_addr_t *, void **);
21954e4ee71SNavdeep Parhar static int free_ring(struct adapter *, bus_dma_tag_t, bus_dmamap_t, bus_addr_t,
22054e4ee71SNavdeep Parhar     void *);
221fe2ebb76SJohn Baldwin static int alloc_iq_fl(struct vi_info *, struct sge_iq *, struct sge_fl *,
222bc14b14dSNavdeep Parhar     int, int);
223fe2ebb76SJohn Baldwin static int free_iq_fl(struct vi_info *, struct sge_iq *, struct sge_fl *);
224348694daSNavdeep Parhar static void add_iq_sysctls(struct sysctl_ctx_list *, struct sysctl_oid *,
225348694daSNavdeep Parhar     struct sge_iq *);
226aa93b99aSNavdeep Parhar static void add_fl_sysctls(struct adapter *, struct sysctl_ctx_list *,
227aa93b99aSNavdeep Parhar     struct sysctl_oid *, struct sge_fl *);
228733b9277SNavdeep Parhar static int alloc_fwq(struct adapter *);
229733b9277SNavdeep Parhar static int free_fwq(struct adapter *);
23037310a98SNavdeep Parhar static int alloc_ctrlq(struct adapter *, struct sge_wrq *, int,
23137310a98SNavdeep Parhar     struct sysctl_oid *);
232fe2ebb76SJohn Baldwin static int alloc_rxq(struct vi_info *, struct sge_rxq *, int, int,
233733b9277SNavdeep Parhar     struct sysctl_oid *);
234fe2ebb76SJohn Baldwin static int free_rxq(struct vi_info *, struct sge_rxq *);
23509fe6320SNavdeep Parhar #ifdef TCP_OFFLOAD
236fe2ebb76SJohn Baldwin static int alloc_ofld_rxq(struct vi_info *, struct sge_ofld_rxq *, int, int,
237733b9277SNavdeep Parhar     struct sysctl_oid *);
238fe2ebb76SJohn Baldwin static int free_ofld_rxq(struct vi_info *, struct sge_ofld_rxq *);
239733b9277SNavdeep Parhar #endif
240298d969cSNavdeep Parhar #ifdef DEV_NETMAP
241fe2ebb76SJohn Baldwin static int alloc_nm_rxq(struct vi_info *, struct sge_nm_rxq *, int, int,
242298d969cSNavdeep Parhar     struct sysctl_oid *);
243fe2ebb76SJohn Baldwin static int free_nm_rxq(struct vi_info *, struct sge_nm_rxq *);
244fe2ebb76SJohn Baldwin static int alloc_nm_txq(struct vi_info *, struct sge_nm_txq *, int, int,
245298d969cSNavdeep Parhar     struct sysctl_oid *);
246fe2ebb76SJohn Baldwin static int free_nm_txq(struct vi_info *, struct sge_nm_txq *);
247298d969cSNavdeep Parhar #endif
248733b9277SNavdeep Parhar static int ctrl_eq_alloc(struct adapter *, struct sge_eq *);
249fe2ebb76SJohn Baldwin static int eth_eq_alloc(struct adapter *, struct vi_info *, struct sge_eq *);
250eff62dbaSNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
251fe2ebb76SJohn Baldwin static int ofld_eq_alloc(struct adapter *, struct vi_info *, struct sge_eq *);
252733b9277SNavdeep Parhar #endif
253fe2ebb76SJohn Baldwin static int alloc_eq(struct adapter *, struct vi_info *, struct sge_eq *);
254733b9277SNavdeep Parhar static int free_eq(struct adapter *, struct sge_eq *);
255fe2ebb76SJohn Baldwin static int alloc_wrq(struct adapter *, struct vi_info *, struct sge_wrq *,
256733b9277SNavdeep Parhar     struct sysctl_oid *);
257733b9277SNavdeep Parhar static int free_wrq(struct adapter *, struct sge_wrq *);
258fe2ebb76SJohn Baldwin static int alloc_txq(struct vi_info *, struct sge_txq *, int,
259733b9277SNavdeep Parhar     struct sysctl_oid *);
260fe2ebb76SJohn Baldwin static int free_txq(struct vi_info *, struct sge_txq *);
26154e4ee71SNavdeep Parhar static void oneseg_dma_callback(void *, bus_dma_segment_t *, int, int);
26254e4ee71SNavdeep Parhar static inline void ring_fl_db(struct adapter *, struct sge_fl *);
263733b9277SNavdeep Parhar static int refill_fl(struct adapter *, struct sge_fl *, int);
264733b9277SNavdeep Parhar static void refill_sfl(void *);
26554e4ee71SNavdeep Parhar static int alloc_fl_sdesc(struct sge_fl *);
2661458bff9SNavdeep Parhar static void free_fl_sdesc(struct adapter *, struct sge_fl *);
26738035ed6SNavdeep Parhar static void find_best_refill_source(struct adapter *, struct sge_fl *, int);
26838035ed6SNavdeep Parhar static void find_safe_refill_source(struct adapter *, struct sge_fl *);
269733b9277SNavdeep Parhar static void add_fl_to_sfl(struct adapter *, struct sge_fl *);
27054e4ee71SNavdeep Parhar 
2717951040fSNavdeep Parhar static inline void get_pkt_gl(struct mbuf *, struct sglist *);
2727951040fSNavdeep Parhar static inline u_int txpkt_len16(u_int, u_int);
2736af45170SJohn Baldwin static inline u_int txpkt_vm_len16(u_int, u_int);
2747951040fSNavdeep Parhar static inline u_int txpkts0_len16(u_int);
2757951040fSNavdeep Parhar static inline u_int txpkts1_len16(void);
276*5cdaef71SJohn Baldwin static u_int write_raw_wr(struct sge_txq *, void *, struct mbuf *, u_int);
2777951040fSNavdeep Parhar static u_int write_txpkt_wr(struct sge_txq *, struct fw_eth_tx_pkt_wr *,
2787951040fSNavdeep Parhar     struct mbuf *, u_int);
279472a6004SNavdeep Parhar static u_int write_txpkt_vm_wr(struct adapter *, struct sge_txq *,
280472a6004SNavdeep Parhar     struct fw_eth_tx_pkt_vm_wr *, struct mbuf *, u_int);
2817951040fSNavdeep Parhar static int try_txpkts(struct mbuf *, struct mbuf *, struct txpkts *, u_int);
2827951040fSNavdeep Parhar static int add_to_txpkts(struct mbuf *, struct txpkts *, u_int);
2837951040fSNavdeep Parhar static u_int write_txpkts_wr(struct sge_txq *, struct fw_eth_tx_pkts_wr *,
2847951040fSNavdeep Parhar     struct mbuf *, const struct txpkts *, u_int);
2857951040fSNavdeep Parhar static void write_gl_to_txd(struct sge_txq *, struct mbuf *, caddr_t *, int);
28654e4ee71SNavdeep Parhar static inline void copy_to_txd(struct sge_eq *, caddr_t, caddr_t *, int);
2877951040fSNavdeep Parhar static inline void ring_eq_db(struct adapter *, struct sge_eq *, u_int);
2887951040fSNavdeep Parhar static inline uint16_t read_hw_cidx(struct sge_eq *);
2897951040fSNavdeep Parhar static inline u_int reclaimable_tx_desc(struct sge_eq *);
2907951040fSNavdeep Parhar static inline u_int total_available_tx_desc(struct sge_eq *);
2917951040fSNavdeep Parhar static u_int reclaim_tx_descs(struct sge_txq *, u_int);
2927951040fSNavdeep Parhar static void tx_reclaim(void *, int);
2937951040fSNavdeep Parhar static __be64 get_flit(struct sglist_seg *, int, int);
294733b9277SNavdeep Parhar static int handle_sge_egr_update(struct sge_iq *, const struct rss_header *,
295733b9277SNavdeep Parhar     struct mbuf *);
2961b4cc91fSNavdeep Parhar static int handle_fw_msg(struct sge_iq *, const struct rss_header *,
297733b9277SNavdeep Parhar     struct mbuf *);
298069af0ebSJohn Baldwin static int t4_handle_wrerr_rpl(struct adapter *, const __be64 *);
2997951040fSNavdeep Parhar static void wrq_tx_drain(void *, int);
3007951040fSNavdeep Parhar static void drain_wrq_wr_list(struct adapter *, struct sge_wrq *);
30154e4ee71SNavdeep Parhar 
30256599263SNavdeep Parhar static int sysctl_uint16(SYSCTL_HANDLER_ARGS);
30338035ed6SNavdeep Parhar static int sysctl_bufsizes(SYSCTL_HANDLER_ARGS);
304786099deSNavdeep Parhar #ifdef RATELIMIT
305786099deSNavdeep Parhar static inline u_int txpkt_eo_len16(u_int, u_int, u_int);
306786099deSNavdeep Parhar static int ethofld_fw4_ack(struct sge_iq *, const struct rss_header *,
307786099deSNavdeep Parhar     struct mbuf *);
308786099deSNavdeep Parhar #endif
309f7dfe243SNavdeep Parhar 
31082eff304SNavdeep Parhar static counter_u64_t extfree_refs;
31182eff304SNavdeep Parhar static counter_u64_t extfree_rels;
31282eff304SNavdeep Parhar 
313671bf2b8SNavdeep Parhar an_handler_t t4_an_handler;
314671bf2b8SNavdeep Parhar fw_msg_handler_t t4_fw_msg_handler[NUM_FW6_TYPES];
315671bf2b8SNavdeep Parhar cpl_handler_t t4_cpl_handler[NUM_CPL_CMDS];
3164535e804SNavdeep Parhar cpl_handler_t set_tcb_rpl_handlers[NUM_CPL_COOKIES];
3174535e804SNavdeep Parhar cpl_handler_t l2t_write_rpl_handlers[NUM_CPL_COOKIES];
318111638bfSNavdeep Parhar cpl_handler_t act_open_rpl_handlers[NUM_CPL_COOKIES];
31989f651e7SNavdeep Parhar cpl_handler_t abort_rpl_rss_handlers[NUM_CPL_COOKIES];
3209c707b32SNavdeep Parhar cpl_handler_t fw4_ack_handlers[NUM_CPL_COOKIES];
321671bf2b8SNavdeep Parhar 
3224535e804SNavdeep Parhar void
323671bf2b8SNavdeep Parhar t4_register_an_handler(an_handler_t h)
324671bf2b8SNavdeep Parhar {
3254535e804SNavdeep Parhar 	uintptr_t *loc;
326671bf2b8SNavdeep Parhar 
3274535e804SNavdeep Parhar 	MPASS(h == NULL || t4_an_handler == NULL);
3284535e804SNavdeep Parhar 
329671bf2b8SNavdeep Parhar 	loc = (uintptr_t *)&t4_an_handler;
3304535e804SNavdeep Parhar 	atomic_store_rel_ptr(loc, (uintptr_t)h);
331671bf2b8SNavdeep Parhar }
332671bf2b8SNavdeep Parhar 
3334535e804SNavdeep Parhar void
334671bf2b8SNavdeep Parhar t4_register_fw_msg_handler(int type, fw_msg_handler_t h)
335671bf2b8SNavdeep Parhar {
3364535e804SNavdeep Parhar 	uintptr_t *loc;
337671bf2b8SNavdeep Parhar 
3384535e804SNavdeep Parhar 	MPASS(type < nitems(t4_fw_msg_handler));
3394535e804SNavdeep Parhar 	MPASS(h == NULL || t4_fw_msg_handler[type] == NULL);
340671bf2b8SNavdeep Parhar 	/*
341671bf2b8SNavdeep Parhar 	 * These are dispatched by the handler for FW{4|6}_CPL_MSG using the CPL
342671bf2b8SNavdeep Parhar 	 * handler dispatch table.  Reject any attempt to install a handler for
343671bf2b8SNavdeep Parhar 	 * this subtype.
344671bf2b8SNavdeep Parhar 	 */
3454535e804SNavdeep Parhar 	MPASS(type != FW_TYPE_RSSCPL);
3464535e804SNavdeep Parhar 	MPASS(type != FW6_TYPE_RSSCPL);
347671bf2b8SNavdeep Parhar 
348671bf2b8SNavdeep Parhar 	loc = (uintptr_t *)&t4_fw_msg_handler[type];
3494535e804SNavdeep Parhar 	atomic_store_rel_ptr(loc, (uintptr_t)h);
3504535e804SNavdeep Parhar }
351671bf2b8SNavdeep Parhar 
3524535e804SNavdeep Parhar void
3534535e804SNavdeep Parhar t4_register_cpl_handler(int opcode, cpl_handler_t h)
3544535e804SNavdeep Parhar {
3554535e804SNavdeep Parhar 	uintptr_t *loc;
3564535e804SNavdeep Parhar 
3574535e804SNavdeep Parhar 	MPASS(opcode < nitems(t4_cpl_handler));
3584535e804SNavdeep Parhar 	MPASS(h == NULL || t4_cpl_handler[opcode] == NULL);
3594535e804SNavdeep Parhar 
3604535e804SNavdeep Parhar 	loc = (uintptr_t *)&t4_cpl_handler[opcode];
3614535e804SNavdeep Parhar 	atomic_store_rel_ptr(loc, (uintptr_t)h);
362671bf2b8SNavdeep Parhar }
363671bf2b8SNavdeep Parhar 
364671bf2b8SNavdeep Parhar static int
3654535e804SNavdeep Parhar set_tcb_rpl_handler(struct sge_iq *iq, const struct rss_header *rss,
3664535e804SNavdeep Parhar     struct mbuf *m)
367671bf2b8SNavdeep Parhar {
3684535e804SNavdeep Parhar 	const struct cpl_set_tcb_rpl *cpl = (const void *)(rss + 1);
3694535e804SNavdeep Parhar 	u_int tid;
3704535e804SNavdeep Parhar 	int cookie;
371671bf2b8SNavdeep Parhar 
3724535e804SNavdeep Parhar 	MPASS(m == NULL);
3734535e804SNavdeep Parhar 
3744535e804SNavdeep Parhar 	tid = GET_TID(cpl);
3755fc0f72fSNavdeep Parhar 	if (is_hpftid(iq->adapter, tid) || is_ftid(iq->adapter, tid)) {
3764535e804SNavdeep Parhar 		/*
3774535e804SNavdeep Parhar 		 * The return code for filter-write is put in the CPL cookie so
3784535e804SNavdeep Parhar 		 * we have to rely on the hardware tid (is_ftid) to determine
3794535e804SNavdeep Parhar 		 * that this is a response to a filter.
3804535e804SNavdeep Parhar 		 */
3814535e804SNavdeep Parhar 		cookie = CPL_COOKIE_FILTER;
3824535e804SNavdeep Parhar 	} else {
3834535e804SNavdeep Parhar 		cookie = G_COOKIE(cpl->cookie);
3844535e804SNavdeep Parhar 	}
3854535e804SNavdeep Parhar 	MPASS(cookie > CPL_COOKIE_RESERVED);
3864535e804SNavdeep Parhar 	MPASS(cookie < nitems(set_tcb_rpl_handlers));
3874535e804SNavdeep Parhar 
3884535e804SNavdeep Parhar 	return (set_tcb_rpl_handlers[cookie](iq, rss, m));
389671bf2b8SNavdeep Parhar }
390671bf2b8SNavdeep Parhar 
3914535e804SNavdeep Parhar static int
3924535e804SNavdeep Parhar l2t_write_rpl_handler(struct sge_iq *iq, const struct rss_header *rss,
3934535e804SNavdeep Parhar     struct mbuf *m)
394671bf2b8SNavdeep Parhar {
3954535e804SNavdeep Parhar 	const struct cpl_l2t_write_rpl *rpl = (const void *)(rss + 1);
3964535e804SNavdeep Parhar 	unsigned int cookie;
397671bf2b8SNavdeep Parhar 
3984535e804SNavdeep Parhar 	MPASS(m == NULL);
399671bf2b8SNavdeep Parhar 
4004535e804SNavdeep Parhar 	cookie = GET_TID(rpl) & F_SYNC_WR ? CPL_COOKIE_TOM : CPL_COOKIE_FILTER;
4014535e804SNavdeep Parhar 	return (l2t_write_rpl_handlers[cookie](iq, rss, m));
4024535e804SNavdeep Parhar }
403671bf2b8SNavdeep Parhar 
404111638bfSNavdeep Parhar static int
405111638bfSNavdeep Parhar act_open_rpl_handler(struct sge_iq *iq, const struct rss_header *rss,
406111638bfSNavdeep Parhar     struct mbuf *m)
407111638bfSNavdeep Parhar {
408111638bfSNavdeep Parhar 	const struct cpl_act_open_rpl *cpl = (const void *)(rss + 1);
409111638bfSNavdeep Parhar 	u_int cookie = G_TID_COOKIE(G_AOPEN_ATID(be32toh(cpl->atid_status)));
410111638bfSNavdeep Parhar 
411111638bfSNavdeep Parhar 	MPASS(m == NULL);
412111638bfSNavdeep Parhar 	MPASS(cookie != CPL_COOKIE_RESERVED);
413111638bfSNavdeep Parhar 
414111638bfSNavdeep Parhar 	return (act_open_rpl_handlers[cookie](iq, rss, m));
415111638bfSNavdeep Parhar }
416111638bfSNavdeep Parhar 
41789f651e7SNavdeep Parhar static int
41889f651e7SNavdeep Parhar abort_rpl_rss_handler(struct sge_iq *iq, const struct rss_header *rss,
41989f651e7SNavdeep Parhar     struct mbuf *m)
42089f651e7SNavdeep Parhar {
42189f651e7SNavdeep Parhar 	struct adapter *sc = iq->adapter;
42289f651e7SNavdeep Parhar 	u_int cookie;
42389f651e7SNavdeep Parhar 
42489f651e7SNavdeep Parhar 	MPASS(m == NULL);
42589f651e7SNavdeep Parhar 	if (is_hashfilter(sc))
42689f651e7SNavdeep Parhar 		cookie = CPL_COOKIE_HASHFILTER;
42789f651e7SNavdeep Parhar 	else
42889f651e7SNavdeep Parhar 		cookie = CPL_COOKIE_TOM;
42989f651e7SNavdeep Parhar 
43089f651e7SNavdeep Parhar 	return (abort_rpl_rss_handlers[cookie](iq, rss, m));
43189f651e7SNavdeep Parhar }
43289f651e7SNavdeep Parhar 
4339c707b32SNavdeep Parhar static int
4349c707b32SNavdeep Parhar fw4_ack_handler(struct sge_iq *iq, const struct rss_header *rss, struct mbuf *m)
4359c707b32SNavdeep Parhar {
4369c707b32SNavdeep Parhar 	struct adapter *sc = iq->adapter;
4379c707b32SNavdeep Parhar 	const struct cpl_fw4_ack *cpl = (const void *)(rss + 1);
4389c707b32SNavdeep Parhar 	unsigned int tid = G_CPL_FW4_ACK_FLOWID(be32toh(OPCODE_TID(cpl)));
4399c707b32SNavdeep Parhar 	u_int cookie;
4409c707b32SNavdeep Parhar 
4419c707b32SNavdeep Parhar 	MPASS(m == NULL);
4429c707b32SNavdeep Parhar 	if (is_etid(sc, tid))
4439c707b32SNavdeep Parhar 		cookie = CPL_COOKIE_ETHOFLD;
4449c707b32SNavdeep Parhar 	else
4459c707b32SNavdeep Parhar 		cookie = CPL_COOKIE_TOM;
4469c707b32SNavdeep Parhar 
4479c707b32SNavdeep Parhar 	return (fw4_ack_handlers[cookie](iq, rss, m));
4489c707b32SNavdeep Parhar }
4499c707b32SNavdeep Parhar 
4504535e804SNavdeep Parhar static void
4514535e804SNavdeep Parhar t4_init_shared_cpl_handlers(void)
4524535e804SNavdeep Parhar {
4534535e804SNavdeep Parhar 
4544535e804SNavdeep Parhar 	t4_register_cpl_handler(CPL_SET_TCB_RPL, set_tcb_rpl_handler);
4554535e804SNavdeep Parhar 	t4_register_cpl_handler(CPL_L2T_WRITE_RPL, l2t_write_rpl_handler);
456111638bfSNavdeep Parhar 	t4_register_cpl_handler(CPL_ACT_OPEN_RPL, act_open_rpl_handler);
45789f651e7SNavdeep Parhar 	t4_register_cpl_handler(CPL_ABORT_RPL_RSS, abort_rpl_rss_handler);
4589c707b32SNavdeep Parhar 	t4_register_cpl_handler(CPL_FW4_ACK, fw4_ack_handler);
4594535e804SNavdeep Parhar }
4604535e804SNavdeep Parhar 
4614535e804SNavdeep Parhar void
4624535e804SNavdeep Parhar t4_register_shared_cpl_handler(int opcode, cpl_handler_t h, int cookie)
4634535e804SNavdeep Parhar {
4644535e804SNavdeep Parhar 	uintptr_t *loc;
4654535e804SNavdeep Parhar 
4664535e804SNavdeep Parhar 	MPASS(opcode < nitems(t4_cpl_handler));
4674535e804SNavdeep Parhar 	MPASS(cookie > CPL_COOKIE_RESERVED);
4684535e804SNavdeep Parhar 	MPASS(cookie < NUM_CPL_COOKIES);
4694535e804SNavdeep Parhar 	MPASS(t4_cpl_handler[opcode] != NULL);
4704535e804SNavdeep Parhar 
4714535e804SNavdeep Parhar 	switch (opcode) {
4724535e804SNavdeep Parhar 	case CPL_SET_TCB_RPL:
4734535e804SNavdeep Parhar 		loc = (uintptr_t *)&set_tcb_rpl_handlers[cookie];
4744535e804SNavdeep Parhar 		break;
4754535e804SNavdeep Parhar 	case CPL_L2T_WRITE_RPL:
4764535e804SNavdeep Parhar 		loc = (uintptr_t *)&l2t_write_rpl_handlers[cookie];
4774535e804SNavdeep Parhar 		break;
478111638bfSNavdeep Parhar 	case CPL_ACT_OPEN_RPL:
479111638bfSNavdeep Parhar 		loc = (uintptr_t *)&act_open_rpl_handlers[cookie];
480111638bfSNavdeep Parhar 		break;
48189f651e7SNavdeep Parhar 	case CPL_ABORT_RPL_RSS:
48289f651e7SNavdeep Parhar 		loc = (uintptr_t *)&abort_rpl_rss_handlers[cookie];
48389f651e7SNavdeep Parhar 		break;
4849c707b32SNavdeep Parhar 	case CPL_FW4_ACK:
4859c707b32SNavdeep Parhar 		loc = (uintptr_t *)&fw4_ack_handlers[cookie];
4869c707b32SNavdeep Parhar 		break;
4874535e804SNavdeep Parhar 	default:
4884535e804SNavdeep Parhar 		MPASS(0);
4894535e804SNavdeep Parhar 		return;
4904535e804SNavdeep Parhar 	}
4914535e804SNavdeep Parhar 	MPASS(h == NULL || *loc == (uintptr_t)NULL);
4924535e804SNavdeep Parhar 	atomic_store_rel_ptr(loc, (uintptr_t)h);
493671bf2b8SNavdeep Parhar }
494671bf2b8SNavdeep Parhar 
49594586193SNavdeep Parhar /*
4961458bff9SNavdeep Parhar  * Called on MOD_LOAD.  Validates and calculates the SGE tunables.
49794586193SNavdeep Parhar  */
49894586193SNavdeep Parhar void
49994586193SNavdeep Parhar t4_sge_modload(void)
50094586193SNavdeep Parhar {
5014defc81bSNavdeep Parhar 
5029fb8886bSNavdeep Parhar 	if (fl_pktshift < 0 || fl_pktshift > 7) {
5039fb8886bSNavdeep Parhar 		printf("Invalid hw.cxgbe.fl_pktshift value (%d),"
504518bca2cSNavdeep Parhar 		    " using 0 instead.\n", fl_pktshift);
505518bca2cSNavdeep Parhar 		fl_pktshift = 0;
5069fb8886bSNavdeep Parhar 	}
5079fb8886bSNavdeep Parhar 
5089fb8886bSNavdeep Parhar 	if (spg_len != 64 && spg_len != 128) {
5099fb8886bSNavdeep Parhar 		int len;
5109fb8886bSNavdeep Parhar 
5119fb8886bSNavdeep Parhar #if defined(__i386__) || defined(__amd64__)
5129fb8886bSNavdeep Parhar 		len = cpu_clflush_line_size > 64 ? 128 : 64;
5139fb8886bSNavdeep Parhar #else
5149fb8886bSNavdeep Parhar 		len = 64;
5159fb8886bSNavdeep Parhar #endif
5169fb8886bSNavdeep Parhar 		if (spg_len != -1) {
5179fb8886bSNavdeep Parhar 			printf("Invalid hw.cxgbe.spg_len value (%d),"
5189fb8886bSNavdeep Parhar 			    " using %d instead.\n", spg_len, len);
5199fb8886bSNavdeep Parhar 		}
5209fb8886bSNavdeep Parhar 		spg_len = len;
5219fb8886bSNavdeep Parhar 	}
5229fb8886bSNavdeep Parhar 
5239fb8886bSNavdeep Parhar 	if (cong_drop < -1 || cong_drop > 1) {
5249fb8886bSNavdeep Parhar 		printf("Invalid hw.cxgbe.cong_drop value (%d),"
5259fb8886bSNavdeep Parhar 		    " using 0 instead.\n", cong_drop);
5269fb8886bSNavdeep Parhar 		cong_drop = 0;
5279fb8886bSNavdeep Parhar 	}
52882eff304SNavdeep Parhar 
529d491f8caSNavdeep Parhar 	if (tscale != 1 && (tscale < 3 || tscale > 17)) {
530d491f8caSNavdeep Parhar 		printf("Invalid hw.cxgbe.tscale value (%d),"
531d491f8caSNavdeep Parhar 		    " using 1 instead.\n", tscale);
532d491f8caSNavdeep Parhar 		tscale = 1;
533d491f8caSNavdeep Parhar 	}
534d491f8caSNavdeep Parhar 
53582eff304SNavdeep Parhar 	extfree_refs = counter_u64_alloc(M_WAITOK);
53682eff304SNavdeep Parhar 	extfree_rels = counter_u64_alloc(M_WAITOK);
53782eff304SNavdeep Parhar 	counter_u64_zero(extfree_refs);
53882eff304SNavdeep Parhar 	counter_u64_zero(extfree_rels);
539671bf2b8SNavdeep Parhar 
5404535e804SNavdeep Parhar 	t4_init_shared_cpl_handlers();
541671bf2b8SNavdeep Parhar 	t4_register_cpl_handler(CPL_FW4_MSG, handle_fw_msg);
542671bf2b8SNavdeep Parhar 	t4_register_cpl_handler(CPL_FW6_MSG, handle_fw_msg);
543671bf2b8SNavdeep Parhar 	t4_register_cpl_handler(CPL_SGE_EGR_UPDATE, handle_sge_egr_update);
544671bf2b8SNavdeep Parhar 	t4_register_cpl_handler(CPL_RX_PKT, t4_eth_rx);
545786099deSNavdeep Parhar #ifdef RATELIMIT
546786099deSNavdeep Parhar 	t4_register_shared_cpl_handler(CPL_FW4_ACK, ethofld_fw4_ack,
547786099deSNavdeep Parhar 	    CPL_COOKIE_ETHOFLD);
548786099deSNavdeep Parhar #endif
549671bf2b8SNavdeep Parhar 	t4_register_fw_msg_handler(FW6_TYPE_CMD_RPL, t4_handle_fw_rpl);
550069af0ebSJohn Baldwin 	t4_register_fw_msg_handler(FW6_TYPE_WRERR_RPL, t4_handle_wrerr_rpl);
55182eff304SNavdeep Parhar }
55282eff304SNavdeep Parhar 
55382eff304SNavdeep Parhar void
55482eff304SNavdeep Parhar t4_sge_modunload(void)
55582eff304SNavdeep Parhar {
55682eff304SNavdeep Parhar 
55782eff304SNavdeep Parhar 	counter_u64_free(extfree_refs);
55882eff304SNavdeep Parhar 	counter_u64_free(extfree_rels);
55982eff304SNavdeep Parhar }
56082eff304SNavdeep Parhar 
56182eff304SNavdeep Parhar uint64_t
56282eff304SNavdeep Parhar t4_sge_extfree_refs(void)
56382eff304SNavdeep Parhar {
56482eff304SNavdeep Parhar 	uint64_t refs, rels;
56582eff304SNavdeep Parhar 
56682eff304SNavdeep Parhar 	rels = counter_u64_fetch(extfree_rels);
56782eff304SNavdeep Parhar 	refs = counter_u64_fetch(extfree_refs);
56882eff304SNavdeep Parhar 
56982eff304SNavdeep Parhar 	return (refs - rels);
57094586193SNavdeep Parhar }
57194586193SNavdeep Parhar 
572e3207e19SNavdeep Parhar static inline void
573e3207e19SNavdeep Parhar setup_pad_and_pack_boundaries(struct adapter *sc)
574e3207e19SNavdeep Parhar {
575e3207e19SNavdeep Parhar 	uint32_t v, m;
5760dbc6cfdSNavdeep Parhar 	int pad, pack, pad_shift;
577e3207e19SNavdeep Parhar 
5780dbc6cfdSNavdeep Parhar 	pad_shift = chip_id(sc) > CHELSIO_T5 ? X_T6_INGPADBOUNDARY_SHIFT :
5790dbc6cfdSNavdeep Parhar 	    X_INGPADBOUNDARY_SHIFT;
580e3207e19SNavdeep Parhar 	pad = fl_pad;
5810dbc6cfdSNavdeep Parhar 	if (fl_pad < (1 << pad_shift) ||
5820dbc6cfdSNavdeep Parhar 	    fl_pad > (1 << (pad_shift + M_INGPADBOUNDARY)) ||
5830dbc6cfdSNavdeep Parhar 	    !powerof2(fl_pad)) {
584e3207e19SNavdeep Parhar 		/*
585e3207e19SNavdeep Parhar 		 * If there is any chance that we might use buffer packing and
586e3207e19SNavdeep Parhar 		 * the chip is a T4, then pick 64 as the pad/pack boundary.  Set
5870dbc6cfdSNavdeep Parhar 		 * it to the minimum allowed in all other cases.
588e3207e19SNavdeep Parhar 		 */
5890dbc6cfdSNavdeep Parhar 		pad = is_t4(sc) && buffer_packing ? 64 : 1 << pad_shift;
590e3207e19SNavdeep Parhar 
591e3207e19SNavdeep Parhar 		/*
592e3207e19SNavdeep Parhar 		 * For fl_pad = 0 we'll still write a reasonable value to the
593e3207e19SNavdeep Parhar 		 * register but all the freelists will opt out of padding.
594e3207e19SNavdeep Parhar 		 * We'll complain here only if the user tried to set it to a
595e3207e19SNavdeep Parhar 		 * value greater than 0 that was invalid.
596e3207e19SNavdeep Parhar 		 */
597e3207e19SNavdeep Parhar 		if (fl_pad > 0) {
598e3207e19SNavdeep Parhar 			device_printf(sc->dev, "Invalid hw.cxgbe.fl_pad value"
599e3207e19SNavdeep Parhar 			    " (%d), using %d instead.\n", fl_pad, pad);
600e3207e19SNavdeep Parhar 		}
601e3207e19SNavdeep Parhar 	}
602e3207e19SNavdeep Parhar 	m = V_INGPADBOUNDARY(M_INGPADBOUNDARY);
6030dbc6cfdSNavdeep Parhar 	v = V_INGPADBOUNDARY(ilog2(pad) - pad_shift);
604e3207e19SNavdeep Parhar 	t4_set_reg_field(sc, A_SGE_CONTROL, m, v);
605e3207e19SNavdeep Parhar 
606e3207e19SNavdeep Parhar 	if (is_t4(sc)) {
607e3207e19SNavdeep Parhar 		if (fl_pack != -1 && fl_pack != pad) {
608e3207e19SNavdeep Parhar 			/* Complain but carry on. */
609e3207e19SNavdeep Parhar 			device_printf(sc->dev, "hw.cxgbe.fl_pack (%d) ignored,"
610e3207e19SNavdeep Parhar 			    " using %d instead.\n", fl_pack, pad);
611e3207e19SNavdeep Parhar 		}
612e3207e19SNavdeep Parhar 		return;
613e3207e19SNavdeep Parhar 	}
614e3207e19SNavdeep Parhar 
615e3207e19SNavdeep Parhar 	pack = fl_pack;
616e3207e19SNavdeep Parhar 	if (fl_pack < 16 || fl_pack == 32 || fl_pack > 4096 ||
617e3207e19SNavdeep Parhar 	    !powerof2(fl_pack)) {
618e3207e19SNavdeep Parhar 		pack = max(sc->params.pci.mps, CACHE_LINE_SIZE);
619e3207e19SNavdeep Parhar 		MPASS(powerof2(pack));
620e3207e19SNavdeep Parhar 		if (pack < 16)
621e3207e19SNavdeep Parhar 			pack = 16;
622e3207e19SNavdeep Parhar 		if (pack == 32)
623e3207e19SNavdeep Parhar 			pack = 64;
624e3207e19SNavdeep Parhar 		if (pack > 4096)
625e3207e19SNavdeep Parhar 			pack = 4096;
626e3207e19SNavdeep Parhar 		if (fl_pack != -1) {
627e3207e19SNavdeep Parhar 			device_printf(sc->dev, "Invalid hw.cxgbe.fl_pack value"
628e3207e19SNavdeep Parhar 			    " (%d), using %d instead.\n", fl_pack, pack);
629e3207e19SNavdeep Parhar 		}
630e3207e19SNavdeep Parhar 	}
631e3207e19SNavdeep Parhar 	m = V_INGPACKBOUNDARY(M_INGPACKBOUNDARY);
632e3207e19SNavdeep Parhar 	if (pack == 16)
633e3207e19SNavdeep Parhar 		v = V_INGPACKBOUNDARY(0);
634e3207e19SNavdeep Parhar 	else
635e3207e19SNavdeep Parhar 		v = V_INGPACKBOUNDARY(ilog2(pack) - 5);
636e3207e19SNavdeep Parhar 
637e3207e19SNavdeep Parhar 	MPASS(!is_t4(sc));	/* T4 doesn't have SGE_CONTROL2 */
638e3207e19SNavdeep Parhar 	t4_set_reg_field(sc, A_SGE_CONTROL2, m, v);
639e3207e19SNavdeep Parhar }
640e3207e19SNavdeep Parhar 
641cf738022SNavdeep Parhar /*
642cf738022SNavdeep Parhar  * adap->params.vpd.cclk must be set up before this is called.
643cf738022SNavdeep Parhar  */
644d14b0ac1SNavdeep Parhar void
645d14b0ac1SNavdeep Parhar t4_tweak_chip_settings(struct adapter *sc)
646d14b0ac1SNavdeep Parhar {
647d14b0ac1SNavdeep Parhar 	int i;
648d14b0ac1SNavdeep Parhar 	uint32_t v, m;
649d14b0ac1SNavdeep Parhar 	int intr_timer[SGE_NTIMERS] = {1, 5, 10, 50, 100, 200};
650cf738022SNavdeep Parhar 	int timer_max = M_TIMERVALUE0 * 1000 / sc->params.vpd.cclk;
651d14b0ac1SNavdeep Parhar 	int intr_pktcount[SGE_NCOUNTERS] = {1, 8, 16, 32}; /* 63 max */
652d14b0ac1SNavdeep Parhar 	uint16_t indsz = min(RX_COPY_THRESHOLD - 1, M_INDICATESIZE);
65338035ed6SNavdeep Parhar 	static int sge_flbuf_sizes[] = {
6541458bff9SNavdeep Parhar 		MCLBYTES,
6551458bff9SNavdeep Parhar #if MJUMPAGESIZE != MCLBYTES
6561458bff9SNavdeep Parhar 		MJUMPAGESIZE,
65738035ed6SNavdeep Parhar 		MJUMPAGESIZE - CL_METADATA_SIZE,
65838035ed6SNavdeep Parhar 		MJUMPAGESIZE - 2 * MSIZE - CL_METADATA_SIZE,
6591458bff9SNavdeep Parhar #endif
6601458bff9SNavdeep Parhar 		MJUM9BYTES,
6611458bff9SNavdeep Parhar 		MJUM16BYTES,
66238035ed6SNavdeep Parhar 		MCLBYTES - MSIZE - CL_METADATA_SIZE,
66338035ed6SNavdeep Parhar 		MJUM9BYTES - CL_METADATA_SIZE,
66438035ed6SNavdeep Parhar 		MJUM16BYTES - CL_METADATA_SIZE,
6651458bff9SNavdeep Parhar 	};
666d14b0ac1SNavdeep Parhar 
667d14b0ac1SNavdeep Parhar 	KASSERT(sc->flags & MASTER_PF,
668d14b0ac1SNavdeep Parhar 	    ("%s: trying to change chip settings when not master.", __func__));
669d14b0ac1SNavdeep Parhar 
6701458bff9SNavdeep Parhar 	m = V_PKTSHIFT(M_PKTSHIFT) | F_RXPKTCPLMODE | F_EGRSTATUSPAGESIZE;
671d14b0ac1SNavdeep Parhar 	v = V_PKTSHIFT(fl_pktshift) | F_RXPKTCPLMODE |
6724defc81bSNavdeep Parhar 	    V_EGRSTATUSPAGESIZE(spg_len == 128);
673d14b0ac1SNavdeep Parhar 	t4_set_reg_field(sc, A_SGE_CONTROL, m, v);
67454e4ee71SNavdeep Parhar 
675e3207e19SNavdeep Parhar 	setup_pad_and_pack_boundaries(sc);
6761458bff9SNavdeep Parhar 
677d14b0ac1SNavdeep Parhar 	v = V_HOSTPAGESIZEPF0(PAGE_SHIFT - 10) |
678733b9277SNavdeep Parhar 	    V_HOSTPAGESIZEPF1(PAGE_SHIFT - 10) |
679733b9277SNavdeep Parhar 	    V_HOSTPAGESIZEPF2(PAGE_SHIFT - 10) |
680733b9277SNavdeep Parhar 	    V_HOSTPAGESIZEPF3(PAGE_SHIFT - 10) |
681733b9277SNavdeep Parhar 	    V_HOSTPAGESIZEPF4(PAGE_SHIFT - 10) |
682733b9277SNavdeep Parhar 	    V_HOSTPAGESIZEPF5(PAGE_SHIFT - 10) |
683733b9277SNavdeep Parhar 	    V_HOSTPAGESIZEPF6(PAGE_SHIFT - 10) |
684733b9277SNavdeep Parhar 	    V_HOSTPAGESIZEPF7(PAGE_SHIFT - 10);
685d14b0ac1SNavdeep Parhar 	t4_write_reg(sc, A_SGE_HOST_PAGE_SIZE, v);
686733b9277SNavdeep Parhar 
68738035ed6SNavdeep Parhar 	KASSERT(nitems(sge_flbuf_sizes) <= SGE_FLBUF_SIZES,
68838035ed6SNavdeep Parhar 	    ("%s: hw buffer size table too big", __func__));
68938035ed6SNavdeep Parhar 	for (i = 0; i < min(nitems(sge_flbuf_sizes), SGE_FLBUF_SIZES); i++) {
69054e4ee71SNavdeep Parhar 		t4_write_reg(sc, A_SGE_FL_BUFFER_SIZE0 + (4 * i),
69138035ed6SNavdeep Parhar 		    sge_flbuf_sizes[i]);
69254e4ee71SNavdeep Parhar 	}
69354e4ee71SNavdeep Parhar 
694d14b0ac1SNavdeep Parhar 	v = V_THRESHOLD_0(intr_pktcount[0]) | V_THRESHOLD_1(intr_pktcount[1]) |
695d14b0ac1SNavdeep Parhar 	    V_THRESHOLD_2(intr_pktcount[2]) | V_THRESHOLD_3(intr_pktcount[3]);
696d14b0ac1SNavdeep Parhar 	t4_write_reg(sc, A_SGE_INGRESS_RX_THRESHOLD, v);
69754e4ee71SNavdeep Parhar 
698cf738022SNavdeep Parhar 	KASSERT(intr_timer[0] <= timer_max,
699cf738022SNavdeep Parhar 	    ("%s: not a single usable timer (%d, %d)", __func__, intr_timer[0],
700cf738022SNavdeep Parhar 	    timer_max));
701cf738022SNavdeep Parhar 	for (i = 1; i < nitems(intr_timer); i++) {
702cf738022SNavdeep Parhar 		KASSERT(intr_timer[i] >= intr_timer[i - 1],
703cf738022SNavdeep Parhar 		    ("%s: timers not listed in increasing order (%d)",
704cf738022SNavdeep Parhar 		    __func__, i));
705cf738022SNavdeep Parhar 
706cf738022SNavdeep Parhar 		while (intr_timer[i] > timer_max) {
707cf738022SNavdeep Parhar 			if (i == nitems(intr_timer) - 1) {
708cf738022SNavdeep Parhar 				intr_timer[i] = timer_max;
709cf738022SNavdeep Parhar 				break;
710cf738022SNavdeep Parhar 			}
711cf738022SNavdeep Parhar 			intr_timer[i] += intr_timer[i - 1];
712cf738022SNavdeep Parhar 			intr_timer[i] /= 2;
713cf738022SNavdeep Parhar 		}
714cf738022SNavdeep Parhar 	}
715cf738022SNavdeep Parhar 
716d14b0ac1SNavdeep Parhar 	v = V_TIMERVALUE0(us_to_core_ticks(sc, intr_timer[0])) |
717d14b0ac1SNavdeep Parhar 	    V_TIMERVALUE1(us_to_core_ticks(sc, intr_timer[1]));
718d14b0ac1SNavdeep Parhar 	t4_write_reg(sc, A_SGE_TIMER_VALUE_0_AND_1, v);
719d14b0ac1SNavdeep Parhar 	v = V_TIMERVALUE2(us_to_core_ticks(sc, intr_timer[2])) |
720d14b0ac1SNavdeep Parhar 	    V_TIMERVALUE3(us_to_core_ticks(sc, intr_timer[3]));
721d14b0ac1SNavdeep Parhar 	t4_write_reg(sc, A_SGE_TIMER_VALUE_2_AND_3, v);
722d14b0ac1SNavdeep Parhar 	v = V_TIMERVALUE4(us_to_core_ticks(sc, intr_timer[4])) |
723d14b0ac1SNavdeep Parhar 	    V_TIMERVALUE5(us_to_core_ticks(sc, intr_timer[5]));
724d14b0ac1SNavdeep Parhar 	t4_write_reg(sc, A_SGE_TIMER_VALUE_4_AND_5, v);
72586e02bf2SNavdeep Parhar 
726d491f8caSNavdeep Parhar 	if (chip_id(sc) >= CHELSIO_T6) {
727d491f8caSNavdeep Parhar 		m = V_TSCALE(M_TSCALE);
728d491f8caSNavdeep Parhar 		if (tscale == 1)
729d491f8caSNavdeep Parhar 			v = 0;
730d491f8caSNavdeep Parhar 		else
731d491f8caSNavdeep Parhar 			v = V_TSCALE(tscale - 2);
732d491f8caSNavdeep Parhar 		t4_set_reg_field(sc, A_SGE_ITP_CONTROL, m, v);
7332f318252SNavdeep Parhar 
7342f318252SNavdeep Parhar 		if (sc->debug_flags & DF_DISABLE_TCB_CACHE) {
7352f318252SNavdeep Parhar 			m = V_RDTHRESHOLD(M_RDTHRESHOLD) | F_WRTHRTHRESHEN |
7362f318252SNavdeep Parhar 			    V_WRTHRTHRESH(M_WRTHRTHRESH);
7372f318252SNavdeep Parhar 			t4_tp_pio_read(sc, &v, 1, A_TP_CMM_CONFIG, 1);
7382f318252SNavdeep Parhar 			v &= ~m;
7392f318252SNavdeep Parhar 			v |= V_RDTHRESHOLD(1) | F_WRTHRTHRESHEN |
7402f318252SNavdeep Parhar 			    V_WRTHRTHRESH(16);
7412f318252SNavdeep Parhar 			t4_tp_pio_write(sc, &v, 1, A_TP_CMM_CONFIG, 1);
7422f318252SNavdeep Parhar 		}
743d491f8caSNavdeep Parhar 	}
744d491f8caSNavdeep Parhar 
7457cba15b1SNavdeep Parhar 	/* 4K, 16K, 64K, 256K DDP "page sizes" for TDDP */
746d14b0ac1SNavdeep Parhar 	v = V_HPZ0(0) | V_HPZ1(2) | V_HPZ2(4) | V_HPZ3(6);
747d14b0ac1SNavdeep Parhar 	t4_write_reg(sc, A_ULP_RX_TDDP_PSZ, v);
748d14b0ac1SNavdeep Parhar 
7497cba15b1SNavdeep Parhar 	/*
7507cba15b1SNavdeep Parhar 	 * 4K, 8K, 16K, 64K DDP "page sizes" for iSCSI DDP.  These have been
7517cba15b1SNavdeep Parhar 	 * chosen with MAXPHYS = 128K in mind.  The largest DDP buffer that we
7527cba15b1SNavdeep Parhar 	 * may have to deal with is MAXPHYS + 1 page.
7537cba15b1SNavdeep Parhar 	 */
7547cba15b1SNavdeep Parhar 	v = V_HPZ0(0) | V_HPZ1(1) | V_HPZ2(2) | V_HPZ3(4);
7557cba15b1SNavdeep Parhar 	t4_write_reg(sc, A_ULP_RX_ISCSI_PSZ, v);
7567cba15b1SNavdeep Parhar 
7577cba15b1SNavdeep Parhar 	/* We use multiple DDP page sizes both in plain-TOE and ISCSI modes. */
7587cba15b1SNavdeep Parhar 	m = v = F_TDDPTAGTCB | F_ISCSITAGTCB;
759d14b0ac1SNavdeep Parhar 	t4_set_reg_field(sc, A_ULP_RX_CTL, m, v);
760d14b0ac1SNavdeep Parhar 
761d14b0ac1SNavdeep Parhar 	m = V_INDICATESIZE(M_INDICATESIZE) | F_REARMDDPOFFSET |
762d14b0ac1SNavdeep Parhar 	    F_RESETDDPOFFSET;
763d14b0ac1SNavdeep Parhar 	v = V_INDICATESIZE(indsz) | F_REARMDDPOFFSET | F_RESETDDPOFFSET;
764d14b0ac1SNavdeep Parhar 	t4_set_reg_field(sc, A_TP_PARA_REG5, m, v);
765d14b0ac1SNavdeep Parhar }
766d14b0ac1SNavdeep Parhar 
767d14b0ac1SNavdeep Parhar /*
768e3207e19SNavdeep Parhar  * SGE wants the buffer to be at least 64B and then a multiple of 16.  If
7698f6690d3SJohn Baldwin  * padding is in use, the buffer's start and end need to be aligned to the pad
770b741402cSNavdeep Parhar  * boundary as well.  We'll just make sure that the size is a multiple of the
771b741402cSNavdeep Parhar  * boundary here, it is up to the buffer allocation code to make sure the start
772b741402cSNavdeep Parhar  * of the buffer is aligned as well.
77338035ed6SNavdeep Parhar  */
77438035ed6SNavdeep Parhar static inline int
775e3207e19SNavdeep Parhar hwsz_ok(struct adapter *sc, int hwsz)
77638035ed6SNavdeep Parhar {
77790e7434aSNavdeep Parhar 	int mask = fl_pad ? sc->params.sge.pad_boundary - 1 : 16 - 1;
77838035ed6SNavdeep Parhar 
779b741402cSNavdeep Parhar 	return (hwsz >= 64 && (hwsz & mask) == 0);
78038035ed6SNavdeep Parhar }
78138035ed6SNavdeep Parhar 
78238035ed6SNavdeep Parhar /*
783d14b0ac1SNavdeep Parhar  * XXX: driver really should be able to deal with unexpected settings.
784d14b0ac1SNavdeep Parhar  */
785d14b0ac1SNavdeep Parhar int
786d14b0ac1SNavdeep Parhar t4_read_chip_settings(struct adapter *sc)
787d14b0ac1SNavdeep Parhar {
788d14b0ac1SNavdeep Parhar 	struct sge *s = &sc->sge;
78990e7434aSNavdeep Parhar 	struct sge_params *sp = &sc->params.sge;
7901458bff9SNavdeep Parhar 	int i, j, n, rc = 0;
791d14b0ac1SNavdeep Parhar 	uint32_t m, v, r;
792d14b0ac1SNavdeep Parhar 	uint16_t indsz = min(RX_COPY_THRESHOLD - 1, M_INDICATESIZE);
79338035ed6SNavdeep Parhar 	static int sw_buf_sizes[] = {	/* Sorted by size */
7941458bff9SNavdeep Parhar 		MCLBYTES,
7951458bff9SNavdeep Parhar #if MJUMPAGESIZE != MCLBYTES
7961458bff9SNavdeep Parhar 		MJUMPAGESIZE,
7971458bff9SNavdeep Parhar #endif
7981458bff9SNavdeep Parhar 		MJUM9BYTES,
7991458bff9SNavdeep Parhar 		MJUM16BYTES
8001458bff9SNavdeep Parhar 	};
80138035ed6SNavdeep Parhar 	struct sw_zone_info *swz, *safe_swz;
80238035ed6SNavdeep Parhar 	struct hw_buf_info *hwb;
803d14b0ac1SNavdeep Parhar 
80490e7434aSNavdeep Parhar 	m = F_RXPKTCPLMODE;
80590e7434aSNavdeep Parhar 	v = F_RXPKTCPLMODE;
80659c1e950SJohn Baldwin 	r = sc->params.sge.sge_control;
807d14b0ac1SNavdeep Parhar 	if ((r & m) != v) {
808d14b0ac1SNavdeep Parhar 		device_printf(sc->dev, "invalid SGE_CONTROL(0x%x)\n", r);
809733b9277SNavdeep Parhar 		rc = EINVAL;
810733b9277SNavdeep Parhar 	}
811733b9277SNavdeep Parhar 
81290e7434aSNavdeep Parhar 	/*
81390e7434aSNavdeep Parhar 	 * If this changes then every single use of PAGE_SHIFT in the driver
81490e7434aSNavdeep Parhar 	 * needs to be carefully reviewed for PAGE_SHIFT vs sp->page_shift.
81590e7434aSNavdeep Parhar 	 */
81690e7434aSNavdeep Parhar 	if (sp->page_shift != PAGE_SHIFT) {
817d14b0ac1SNavdeep Parhar 		device_printf(sc->dev, "invalid SGE_HOST_PAGE_SIZE(0x%x)\n", r);
818733b9277SNavdeep Parhar 		rc = EINVAL;
819733b9277SNavdeep Parhar 	}
820733b9277SNavdeep Parhar 
82138035ed6SNavdeep Parhar 	/* Filter out unusable hw buffer sizes entirely (mark with -2). */
82238035ed6SNavdeep Parhar 	hwb = &s->hw_buf_info[0];
82338035ed6SNavdeep Parhar 	for (i = 0; i < nitems(s->hw_buf_info); i++, hwb++) {
82459c1e950SJohn Baldwin 		r = sc->params.sge.sge_fl_buffer_size[i];
82538035ed6SNavdeep Parhar 		hwb->size = r;
826e3207e19SNavdeep Parhar 		hwb->zidx = hwsz_ok(sc, r) ? -1 : -2;
82738035ed6SNavdeep Parhar 		hwb->next = -1;
8281458bff9SNavdeep Parhar 	}
82938035ed6SNavdeep Parhar 
83038035ed6SNavdeep Parhar 	/*
83138035ed6SNavdeep Parhar 	 * Create a sorted list in decreasing order of hw buffer sizes (and so
83238035ed6SNavdeep Parhar 	 * increasing order of spare area) for each software zone.
833e3207e19SNavdeep Parhar 	 *
834e3207e19SNavdeep Parhar 	 * If padding is enabled then the start and end of the buffer must align
835e3207e19SNavdeep Parhar 	 * to the pad boundary; if packing is enabled then they must align with
836e3207e19SNavdeep Parhar 	 * the pack boundary as well.  Allocations from the cluster zones are
837e3207e19SNavdeep Parhar 	 * aligned to min(size, 4K), so the buffer starts at that alignment and
838e3207e19SNavdeep Parhar 	 * ends at hwb->size alignment.  If mbuf inlining is allowed the
839e3207e19SNavdeep Parhar 	 * starting alignment will be reduced to MSIZE and the driver will
840e3207e19SNavdeep Parhar 	 * exercise appropriate caution when deciding on the best buffer layout
841e3207e19SNavdeep Parhar 	 * to use.
84238035ed6SNavdeep Parhar 	 */
84338035ed6SNavdeep Parhar 	n = 0;	/* no usable buffer size to begin with */
84438035ed6SNavdeep Parhar 	swz = &s->sw_zone_info[0];
84538035ed6SNavdeep Parhar 	safe_swz = NULL;
84638035ed6SNavdeep Parhar 	for (i = 0; i < SW_ZONE_SIZES; i++, swz++) {
84738035ed6SNavdeep Parhar 		int8_t head = -1, tail = -1;
84838035ed6SNavdeep Parhar 
84938035ed6SNavdeep Parhar 		swz->size = sw_buf_sizes[i];
85038035ed6SNavdeep Parhar 		swz->zone = m_getzone(swz->size);
85138035ed6SNavdeep Parhar 		swz->type = m_gettype(swz->size);
85238035ed6SNavdeep Parhar 
853e3207e19SNavdeep Parhar 		if (swz->size < PAGE_SIZE) {
854e3207e19SNavdeep Parhar 			MPASS(powerof2(swz->size));
85590e7434aSNavdeep Parhar 			if (fl_pad && (swz->size % sp->pad_boundary != 0))
856e3207e19SNavdeep Parhar 				continue;
857e3207e19SNavdeep Parhar 		}
858e3207e19SNavdeep Parhar 
85938035ed6SNavdeep Parhar 		if (swz->size == safest_rx_cluster)
86038035ed6SNavdeep Parhar 			safe_swz = swz;
86138035ed6SNavdeep Parhar 
86238035ed6SNavdeep Parhar 		hwb = &s->hw_buf_info[0];
86338035ed6SNavdeep Parhar 		for (j = 0; j < SGE_FLBUF_SIZES; j++, hwb++) {
86438035ed6SNavdeep Parhar 			if (hwb->zidx != -1 || hwb->size > swz->size)
8651458bff9SNavdeep Parhar 				continue;
866e3207e19SNavdeep Parhar #ifdef INVARIANTS
867e3207e19SNavdeep Parhar 			if (fl_pad)
86890e7434aSNavdeep Parhar 				MPASS(hwb->size % sp->pad_boundary == 0);
869e3207e19SNavdeep Parhar #endif
87038035ed6SNavdeep Parhar 			hwb->zidx = i;
87138035ed6SNavdeep Parhar 			if (head == -1)
87238035ed6SNavdeep Parhar 				head = tail = j;
87338035ed6SNavdeep Parhar 			else if (hwb->size < s->hw_buf_info[tail].size) {
87438035ed6SNavdeep Parhar 				s->hw_buf_info[tail].next = j;
87538035ed6SNavdeep Parhar 				tail = j;
87638035ed6SNavdeep Parhar 			} else {
87738035ed6SNavdeep Parhar 				int8_t *cur;
87838035ed6SNavdeep Parhar 				struct hw_buf_info *t;
87938035ed6SNavdeep Parhar 
88038035ed6SNavdeep Parhar 				for (cur = &head; *cur != -1; cur = &t->next) {
88138035ed6SNavdeep Parhar 					t = &s->hw_buf_info[*cur];
88238035ed6SNavdeep Parhar 					if (hwb->size == t->size) {
88338035ed6SNavdeep Parhar 						hwb->zidx = -2;
8841458bff9SNavdeep Parhar 						break;
8851458bff9SNavdeep Parhar 					}
88638035ed6SNavdeep Parhar 					if (hwb->size > t->size) {
88738035ed6SNavdeep Parhar 						hwb->next = *cur;
88838035ed6SNavdeep Parhar 						*cur = j;
88938035ed6SNavdeep Parhar 						break;
89038035ed6SNavdeep Parhar 					}
89138035ed6SNavdeep Parhar 				}
89238035ed6SNavdeep Parhar 			}
89338035ed6SNavdeep Parhar 		}
89438035ed6SNavdeep Parhar 		swz->head_hwidx = head;
89538035ed6SNavdeep Parhar 		swz->tail_hwidx = tail;
89638035ed6SNavdeep Parhar 
89738035ed6SNavdeep Parhar 		if (tail != -1) {
89838035ed6SNavdeep Parhar 			n++;
89938035ed6SNavdeep Parhar 			if (swz->size - s->hw_buf_info[tail].size >=
90038035ed6SNavdeep Parhar 			    CL_METADATA_SIZE)
90138035ed6SNavdeep Parhar 				sc->flags |= BUF_PACKING_OK;
90238035ed6SNavdeep Parhar 		}
9031458bff9SNavdeep Parhar 	}
9041458bff9SNavdeep Parhar 	if (n == 0) {
9051458bff9SNavdeep Parhar 		device_printf(sc->dev, "no usable SGE FL buffer size.\n");
9061458bff9SNavdeep Parhar 		rc = EINVAL;
907733b9277SNavdeep Parhar 	}
90838035ed6SNavdeep Parhar 
90938035ed6SNavdeep Parhar 	s->safe_hwidx1 = -1;
91038035ed6SNavdeep Parhar 	s->safe_hwidx2 = -1;
91138035ed6SNavdeep Parhar 	if (safe_swz != NULL) {
91238035ed6SNavdeep Parhar 		s->safe_hwidx1 = safe_swz->head_hwidx;
91338035ed6SNavdeep Parhar 		for (i = safe_swz->head_hwidx; i != -1; i = hwb->next) {
91438035ed6SNavdeep Parhar 			int spare;
91538035ed6SNavdeep Parhar 
91638035ed6SNavdeep Parhar 			hwb = &s->hw_buf_info[i];
917e3207e19SNavdeep Parhar #ifdef INVARIANTS
918e3207e19SNavdeep Parhar 			if (fl_pad)
91990e7434aSNavdeep Parhar 				MPASS(hwb->size % sp->pad_boundary == 0);
920e3207e19SNavdeep Parhar #endif
92138035ed6SNavdeep Parhar 			spare = safe_swz->size - hwb->size;
922e3207e19SNavdeep Parhar 			if (spare >= CL_METADATA_SIZE) {
92338035ed6SNavdeep Parhar 				s->safe_hwidx2 = i;
92438035ed6SNavdeep Parhar 				break;
92538035ed6SNavdeep Parhar 			}
92638035ed6SNavdeep Parhar 		}
927e3207e19SNavdeep Parhar 	}
928733b9277SNavdeep Parhar 
9296af45170SJohn Baldwin 	if (sc->flags & IS_VF)
9306af45170SJohn Baldwin 		return (0);
9316af45170SJohn Baldwin 
932d14b0ac1SNavdeep Parhar 	v = V_HPZ0(0) | V_HPZ1(2) | V_HPZ2(4) | V_HPZ3(6);
933d14b0ac1SNavdeep Parhar 	r = t4_read_reg(sc, A_ULP_RX_TDDP_PSZ);
934d14b0ac1SNavdeep Parhar 	if (r != v) {
935d14b0ac1SNavdeep Parhar 		device_printf(sc->dev, "invalid ULP_RX_TDDP_PSZ(0x%x)\n", r);
936d14b0ac1SNavdeep Parhar 		rc = EINVAL;
937d14b0ac1SNavdeep Parhar 	}
938733b9277SNavdeep Parhar 
939d14b0ac1SNavdeep Parhar 	m = v = F_TDDPTAGTCB;
940d14b0ac1SNavdeep Parhar 	r = t4_read_reg(sc, A_ULP_RX_CTL);
941d14b0ac1SNavdeep Parhar 	if ((r & m) != v) {
942d14b0ac1SNavdeep Parhar 		device_printf(sc->dev, "invalid ULP_RX_CTL(0x%x)\n", r);
943d14b0ac1SNavdeep Parhar 		rc = EINVAL;
944d14b0ac1SNavdeep Parhar 	}
945d14b0ac1SNavdeep Parhar 
946d14b0ac1SNavdeep Parhar 	m = V_INDICATESIZE(M_INDICATESIZE) | F_REARMDDPOFFSET |
947d14b0ac1SNavdeep Parhar 	    F_RESETDDPOFFSET;
948d14b0ac1SNavdeep Parhar 	v = V_INDICATESIZE(indsz) | F_REARMDDPOFFSET | F_RESETDDPOFFSET;
949d14b0ac1SNavdeep Parhar 	r = t4_read_reg(sc, A_TP_PARA_REG5);
950d14b0ac1SNavdeep Parhar 	if ((r & m) != v) {
951d14b0ac1SNavdeep Parhar 		device_printf(sc->dev, "invalid TP_PARA_REG5(0x%x)\n", r);
952d14b0ac1SNavdeep Parhar 		rc = EINVAL;
953d14b0ac1SNavdeep Parhar 	}
954d14b0ac1SNavdeep Parhar 
955c45b1868SNavdeep Parhar 	t4_init_tp_params(sc, 1);
956d14b0ac1SNavdeep Parhar 
957d14b0ac1SNavdeep Parhar 	t4_read_mtu_tbl(sc, sc->params.mtus, NULL);
958d14b0ac1SNavdeep Parhar 	t4_load_mtus(sc, sc->params.mtus, sc->params.a_wnd, sc->params.b_wnd);
959d14b0ac1SNavdeep Parhar 
960733b9277SNavdeep Parhar 	return (rc);
96154e4ee71SNavdeep Parhar }
96254e4ee71SNavdeep Parhar 
96354e4ee71SNavdeep Parhar int
96454e4ee71SNavdeep Parhar t4_create_dma_tag(struct adapter *sc)
96554e4ee71SNavdeep Parhar {
96654e4ee71SNavdeep Parhar 	int rc;
96754e4ee71SNavdeep Parhar 
96854e4ee71SNavdeep Parhar 	rc = bus_dma_tag_create(bus_get_dma_tag(sc->dev), 1, 0,
96954e4ee71SNavdeep Parhar 	    BUS_SPACE_MAXADDR, BUS_SPACE_MAXADDR, NULL, NULL, BUS_SPACE_MAXSIZE,
97054e4ee71SNavdeep Parhar 	    BUS_SPACE_UNRESTRICTED, BUS_SPACE_MAXSIZE, BUS_DMA_ALLOCNOW, NULL,
97154e4ee71SNavdeep Parhar 	    NULL, &sc->dmat);
97254e4ee71SNavdeep Parhar 	if (rc != 0) {
97354e4ee71SNavdeep Parhar 		device_printf(sc->dev,
97454e4ee71SNavdeep Parhar 		    "failed to create main DMA tag: %d\n", rc);
97554e4ee71SNavdeep Parhar 	}
97654e4ee71SNavdeep Parhar 
97754e4ee71SNavdeep Parhar 	return (rc);
97854e4ee71SNavdeep Parhar }
97954e4ee71SNavdeep Parhar 
9806e22f9f3SNavdeep Parhar void
9816e22f9f3SNavdeep Parhar t4_sge_sysctls(struct adapter *sc, struct sysctl_ctx_list *ctx,
9826e22f9f3SNavdeep Parhar     struct sysctl_oid_list *children)
9836e22f9f3SNavdeep Parhar {
98490e7434aSNavdeep Parhar 	struct sge_params *sp = &sc->params.sge;
9856e22f9f3SNavdeep Parhar 
98638035ed6SNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "buffer_sizes",
98738035ed6SNavdeep Parhar 	    CTLTYPE_STRING | CTLFLAG_RD, &sc->sge, 0, sysctl_bufsizes, "A",
98838035ed6SNavdeep Parhar 	    "freelist buffer sizes");
98938035ed6SNavdeep Parhar 
9906e22f9f3SNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "fl_pktshift", CTLFLAG_RD,
99190e7434aSNavdeep Parhar 	    NULL, sp->fl_pktshift, "payload DMA offset in rx buffer (bytes)");
9926e22f9f3SNavdeep Parhar 
9936e22f9f3SNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "fl_pad", CTLFLAG_RD,
99490e7434aSNavdeep Parhar 	    NULL, sp->pad_boundary, "payload pad boundary (bytes)");
9956e22f9f3SNavdeep Parhar 
9966e22f9f3SNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "spg_len", CTLFLAG_RD,
99790e7434aSNavdeep Parhar 	    NULL, sp->spg_len, "status page size (bytes)");
9986e22f9f3SNavdeep Parhar 
9996e22f9f3SNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "cong_drop", CTLFLAG_RD,
10006e22f9f3SNavdeep Parhar 	    NULL, cong_drop, "congestion drop setting");
10011458bff9SNavdeep Parhar 
10021458bff9SNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "fl_pack", CTLFLAG_RD,
100390e7434aSNavdeep Parhar 	    NULL, sp->pack_boundary, "payload pack boundary (bytes)");
10046e22f9f3SNavdeep Parhar }
10056e22f9f3SNavdeep Parhar 
100654e4ee71SNavdeep Parhar int
100754e4ee71SNavdeep Parhar t4_destroy_dma_tag(struct adapter *sc)
100854e4ee71SNavdeep Parhar {
100954e4ee71SNavdeep Parhar 	if (sc->dmat)
101054e4ee71SNavdeep Parhar 		bus_dma_tag_destroy(sc->dmat);
101154e4ee71SNavdeep Parhar 
101254e4ee71SNavdeep Parhar 	return (0);
101354e4ee71SNavdeep Parhar }
101454e4ee71SNavdeep Parhar 
101554e4ee71SNavdeep Parhar /*
101637310a98SNavdeep Parhar  * Allocate and initialize the firmware event queue, control queues, and special
101737310a98SNavdeep Parhar  * purpose rx queues owned by the adapter.
101854e4ee71SNavdeep Parhar  *
101954e4ee71SNavdeep Parhar  * Returns errno on failure.  Resources allocated up to that point may still be
102054e4ee71SNavdeep Parhar  * allocated.  Caller is responsible for cleanup in case this function fails.
102154e4ee71SNavdeep Parhar  */
102254e4ee71SNavdeep Parhar int
1023f7dfe243SNavdeep Parhar t4_setup_adapter_queues(struct adapter *sc)
102454e4ee71SNavdeep Parhar {
102537310a98SNavdeep Parhar 	struct sysctl_oid *oid;
102637310a98SNavdeep Parhar 	struct sysctl_oid_list *children;
102737310a98SNavdeep Parhar 	int rc, i;
102854e4ee71SNavdeep Parhar 
102954e4ee71SNavdeep Parhar 	ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
103054e4ee71SNavdeep Parhar 
1031733b9277SNavdeep Parhar 	sysctl_ctx_init(&sc->ctx);
1032733b9277SNavdeep Parhar 	sc->flags |= ADAP_SYSCTL_CTX;
103354e4ee71SNavdeep Parhar 
103456599263SNavdeep Parhar 	/*
103556599263SNavdeep Parhar 	 * Firmware event queue
103656599263SNavdeep Parhar 	 */
1037733b9277SNavdeep Parhar 	rc = alloc_fwq(sc);
1038aa95b653SNavdeep Parhar 	if (rc != 0)
1039f7dfe243SNavdeep Parhar 		return (rc);
1040f7dfe243SNavdeep Parhar 
1041f7dfe243SNavdeep Parhar 	/*
104237310a98SNavdeep Parhar 	 * That's all for the VF driver.
1043f7dfe243SNavdeep Parhar 	 */
104437310a98SNavdeep Parhar 	if (sc->flags & IS_VF)
104537310a98SNavdeep Parhar 		return (rc);
104637310a98SNavdeep Parhar 
104737310a98SNavdeep Parhar 	oid = device_get_sysctl_tree(sc->dev);
104837310a98SNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
104937310a98SNavdeep Parhar 
105037310a98SNavdeep Parhar 	/*
105137310a98SNavdeep Parhar 	 * XXX: General purpose rx queues, one per port.
105237310a98SNavdeep Parhar 	 */
105337310a98SNavdeep Parhar 
105437310a98SNavdeep Parhar 	/*
105537310a98SNavdeep Parhar 	 * Control queues, one per port.
105637310a98SNavdeep Parhar 	 */
105737310a98SNavdeep Parhar 	oid = SYSCTL_ADD_NODE(&sc->ctx, children, OID_AUTO, "ctrlq",
105837310a98SNavdeep Parhar 	    CTLFLAG_RD, NULL, "control queues");
105937310a98SNavdeep Parhar 	for_each_port(sc, i) {
106037310a98SNavdeep Parhar 		struct sge_wrq *ctrlq = &sc->sge.ctrlq[i];
106137310a98SNavdeep Parhar 
106237310a98SNavdeep Parhar 		rc = alloc_ctrlq(sc, ctrlq, i, oid);
106337310a98SNavdeep Parhar 		if (rc != 0)
106437310a98SNavdeep Parhar 			return (rc);
106537310a98SNavdeep Parhar 	}
106654e4ee71SNavdeep Parhar 
106754e4ee71SNavdeep Parhar 	return (rc);
106854e4ee71SNavdeep Parhar }
106954e4ee71SNavdeep Parhar 
107054e4ee71SNavdeep Parhar /*
107154e4ee71SNavdeep Parhar  * Idempotent
107254e4ee71SNavdeep Parhar  */
107354e4ee71SNavdeep Parhar int
1074f7dfe243SNavdeep Parhar t4_teardown_adapter_queues(struct adapter *sc)
107554e4ee71SNavdeep Parhar {
107637310a98SNavdeep Parhar 	int i;
107754e4ee71SNavdeep Parhar 
107854e4ee71SNavdeep Parhar 	ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
107954e4ee71SNavdeep Parhar 
1080733b9277SNavdeep Parhar 	/* Do this before freeing the queue */
1081733b9277SNavdeep Parhar 	if (sc->flags & ADAP_SYSCTL_CTX) {
1082f7dfe243SNavdeep Parhar 		sysctl_ctx_free(&sc->ctx);
1083733b9277SNavdeep Parhar 		sc->flags &= ~ADAP_SYSCTL_CTX;
1084f7dfe243SNavdeep Parhar 	}
1085f7dfe243SNavdeep Parhar 
1086b8bfcb71SNavdeep Parhar 	if (!(sc->flags & IS_VF)) {
108737310a98SNavdeep Parhar 		for_each_port(sc, i)
108837310a98SNavdeep Parhar 			free_wrq(sc, &sc->sge.ctrlq[i]);
1089b8bfcb71SNavdeep Parhar 	}
1090733b9277SNavdeep Parhar 	free_fwq(sc);
109154e4ee71SNavdeep Parhar 
109254e4ee71SNavdeep Parhar 	return (0);
109354e4ee71SNavdeep Parhar }
109454e4ee71SNavdeep Parhar 
109538035ed6SNavdeep Parhar /* Maximum payload that can be delivered with a single iq descriptor */
10968340ece5SNavdeep Parhar static inline int
109738035ed6SNavdeep Parhar mtu_to_max_payload(struct adapter *sc, int mtu, const int toe)
10988340ece5SNavdeep Parhar {
109938035ed6SNavdeep Parhar 	int payload;
11008340ece5SNavdeep Parhar 
11016eb3180fSNavdeep Parhar #ifdef TCP_OFFLOAD
110238035ed6SNavdeep Parhar 	if (toe) {
11031131c927SNavdeep Parhar 		int rxcs = G_RXCOALESCESIZE(t4_read_reg(sc, A_TP_PARA_REG2));
11041131c927SNavdeep Parhar 
11051131c927SNavdeep Parhar 		/* Note that COP can set rx_coalesce on/off per connection. */
11061131c927SNavdeep Parhar 		payload = max(mtu, rxcs);
110738035ed6SNavdeep Parhar 	} else {
110838035ed6SNavdeep Parhar #endif
110938035ed6SNavdeep Parhar 		/* large enough even when hw VLAN extraction is disabled */
111090e7434aSNavdeep Parhar 		payload = sc->params.sge.fl_pktshift + ETHER_HDR_LEN +
111190e7434aSNavdeep Parhar 		    ETHER_VLAN_ENCAP_LEN + mtu;
111238035ed6SNavdeep Parhar #ifdef TCP_OFFLOAD
11136eb3180fSNavdeep Parhar 	}
11146eb3180fSNavdeep Parhar #endif
111538035ed6SNavdeep Parhar 
111638035ed6SNavdeep Parhar 	return (payload);
111738035ed6SNavdeep Parhar }
11186eb3180fSNavdeep Parhar 
1119733b9277SNavdeep Parhar int
1120fe2ebb76SJohn Baldwin t4_setup_vi_queues(struct vi_info *vi)
1121733b9277SNavdeep Parhar {
1122f549e352SNavdeep Parhar 	int rc = 0, i, intr_idx, iqidx;
1123733b9277SNavdeep Parhar 	struct sge_rxq *rxq;
1124733b9277SNavdeep Parhar 	struct sge_txq *txq;
112509fe6320SNavdeep Parhar #ifdef TCP_OFFLOAD
1126733b9277SNavdeep Parhar 	struct sge_ofld_rxq *ofld_rxq;
1127eff62dbaSNavdeep Parhar #endif
1128eff62dbaSNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
1129733b9277SNavdeep Parhar 	struct sge_wrq *ofld_txq;
1130298d969cSNavdeep Parhar #endif
1131298d969cSNavdeep Parhar #ifdef DEV_NETMAP
113262291463SNavdeep Parhar 	int saved_idx;
1133298d969cSNavdeep Parhar 	struct sge_nm_rxq *nm_rxq;
1134298d969cSNavdeep Parhar 	struct sge_nm_txq *nm_txq;
1135733b9277SNavdeep Parhar #endif
1136733b9277SNavdeep Parhar 	char name[16];
1137fe2ebb76SJohn Baldwin 	struct port_info *pi = vi->pi;
1138733b9277SNavdeep Parhar 	struct adapter *sc = pi->adapter;
1139fe2ebb76SJohn Baldwin 	struct ifnet *ifp = vi->ifp;
1140fe2ebb76SJohn Baldwin 	struct sysctl_oid *oid = device_get_sysctl_tree(vi->dev);
1141733b9277SNavdeep Parhar 	struct sysctl_oid_list *children = SYSCTL_CHILDREN(oid);
1142e3207e19SNavdeep Parhar 	int maxp, mtu = ifp->if_mtu;
1143733b9277SNavdeep Parhar 
1144733b9277SNavdeep Parhar 	/* Interrupt vector to start from (when using multiple vectors) */
1145f549e352SNavdeep Parhar 	intr_idx = vi->first_intr;
1146fe2ebb76SJohn Baldwin 
1147fe2ebb76SJohn Baldwin #ifdef DEV_NETMAP
114862291463SNavdeep Parhar 	saved_idx = intr_idx;
114962291463SNavdeep Parhar 	if (ifp->if_capabilities & IFCAP_NETMAP) {
115062291463SNavdeep Parhar 
115162291463SNavdeep Parhar 		/* netmap is supported with direct interrupts only. */
1152f549e352SNavdeep Parhar 		MPASS(!forwarding_intr_to_fwq(sc));
115362291463SNavdeep Parhar 
1154fe2ebb76SJohn Baldwin 		/*
1155fe2ebb76SJohn Baldwin 		 * We don't have buffers to back the netmap rx queues
1156fe2ebb76SJohn Baldwin 		 * right now so we create the queues in a way that
1157fe2ebb76SJohn Baldwin 		 * doesn't set off any congestion signal in the chip.
1158fe2ebb76SJohn Baldwin 		 */
115962291463SNavdeep Parhar 		oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, "nm_rxq",
1160fe2ebb76SJohn Baldwin 		    CTLFLAG_RD, NULL, "rx queues");
1161fe2ebb76SJohn Baldwin 		for_each_nm_rxq(vi, i, nm_rxq) {
1162fe2ebb76SJohn Baldwin 			rc = alloc_nm_rxq(vi, nm_rxq, intr_idx, i, oid);
1163fe2ebb76SJohn Baldwin 			if (rc != 0)
1164fe2ebb76SJohn Baldwin 				goto done;
1165fe2ebb76SJohn Baldwin 			intr_idx++;
1166fe2ebb76SJohn Baldwin 		}
1167fe2ebb76SJohn Baldwin 
116862291463SNavdeep Parhar 		oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, "nm_txq",
1169fe2ebb76SJohn Baldwin 		    CTLFLAG_RD, NULL, "tx queues");
1170fe2ebb76SJohn Baldwin 		for_each_nm_txq(vi, i, nm_txq) {
1171f549e352SNavdeep Parhar 			iqidx = vi->first_nm_rxq + (i % vi->nnmrxq);
1172f549e352SNavdeep Parhar 			rc = alloc_nm_txq(vi, nm_txq, iqidx, i, oid);
1173fe2ebb76SJohn Baldwin 			if (rc != 0)
1174fe2ebb76SJohn Baldwin 				goto done;
1175fe2ebb76SJohn Baldwin 		}
1176fe2ebb76SJohn Baldwin 	}
117762291463SNavdeep Parhar 
117862291463SNavdeep Parhar 	/* Normal rx queues and netmap rx queues share the same interrupts. */
117962291463SNavdeep Parhar 	intr_idx = saved_idx;
1180fe2ebb76SJohn Baldwin #endif
1181733b9277SNavdeep Parhar 
1182733b9277SNavdeep Parhar 	/*
1183f549e352SNavdeep Parhar 	 * Allocate rx queues first because a default iqid is required when
1184f549e352SNavdeep Parhar 	 * creating a tx queue.
1185733b9277SNavdeep Parhar 	 */
118638035ed6SNavdeep Parhar 	maxp = mtu_to_max_payload(sc, mtu, 0);
1187fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, "rxq",
1188298d969cSNavdeep Parhar 	    CTLFLAG_RD, NULL, "rx queues");
1189fe2ebb76SJohn Baldwin 	for_each_rxq(vi, i, rxq) {
119054e4ee71SNavdeep Parhar 
1191fe2ebb76SJohn Baldwin 		init_iq(&rxq->iq, sc, vi->tmr_idx, vi->pktc_idx, vi->qsize_rxq);
119254e4ee71SNavdeep Parhar 
119354e4ee71SNavdeep Parhar 		snprintf(name, sizeof(name), "%s rxq%d-fl",
1194fe2ebb76SJohn Baldwin 		    device_get_nameunit(vi->dev), i);
1195fe2ebb76SJohn Baldwin 		init_fl(sc, &rxq->fl, vi->qsize_rxq / 8, maxp, name);
119654e4ee71SNavdeep Parhar 
1197f549e352SNavdeep Parhar 		rc = alloc_rxq(vi, rxq,
1198f549e352SNavdeep Parhar 		    forwarding_intr_to_fwq(sc) ? -1 : intr_idx, i, oid);
119954e4ee71SNavdeep Parhar 		if (rc != 0)
120054e4ee71SNavdeep Parhar 			goto done;
1201733b9277SNavdeep Parhar 		intr_idx++;
1202733b9277SNavdeep Parhar 	}
120362291463SNavdeep Parhar #ifdef DEV_NETMAP
120462291463SNavdeep Parhar 	if (ifp->if_capabilities & IFCAP_NETMAP)
120562291463SNavdeep Parhar 		intr_idx = saved_idx + max(vi->nrxq, vi->nnmrxq);
120662291463SNavdeep Parhar #endif
120709fe6320SNavdeep Parhar #ifdef TCP_OFFLOAD
120838035ed6SNavdeep Parhar 	maxp = mtu_to_max_payload(sc, mtu, 1);
1209fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, "ofld_rxq",
1210f549e352SNavdeep Parhar 	    CTLFLAG_RD, NULL, "rx queues for offloaded TCP connections");
1211fe2ebb76SJohn Baldwin 	for_each_ofld_rxq(vi, i, ofld_rxq) {
1212733b9277SNavdeep Parhar 
121308cd1f11SNavdeep Parhar 		init_iq(&ofld_rxq->iq, sc, vi->ofld_tmr_idx, vi->ofld_pktc_idx,
1214fe2ebb76SJohn Baldwin 		    vi->qsize_rxq);
1215733b9277SNavdeep Parhar 
1216733b9277SNavdeep Parhar 		snprintf(name, sizeof(name), "%s ofld_rxq%d-fl",
1217fe2ebb76SJohn Baldwin 		    device_get_nameunit(vi->dev), i);
1218fe2ebb76SJohn Baldwin 		init_fl(sc, &ofld_rxq->fl, vi->qsize_rxq / 8, maxp, name);
1219733b9277SNavdeep Parhar 
1220f549e352SNavdeep Parhar 		rc = alloc_ofld_rxq(vi, ofld_rxq,
1221f549e352SNavdeep Parhar 		    forwarding_intr_to_fwq(sc) ? -1 : intr_idx, i, oid);
1222733b9277SNavdeep Parhar 		if (rc != 0)
1223733b9277SNavdeep Parhar 			goto done;
1224733b9277SNavdeep Parhar 		intr_idx++;
1225733b9277SNavdeep Parhar 	}
1226733b9277SNavdeep Parhar #endif
1227733b9277SNavdeep Parhar 
1228733b9277SNavdeep Parhar 	/*
1229f549e352SNavdeep Parhar 	 * Now the tx queues.
1230733b9277SNavdeep Parhar 	 */
1231fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, "txq", CTLFLAG_RD,
1232733b9277SNavdeep Parhar 	    NULL, "tx queues");
1233fe2ebb76SJohn Baldwin 	for_each_txq(vi, i, txq) {
1234f549e352SNavdeep Parhar 		iqidx = vi->first_rxq + (i % vi->nrxq);
123554e4ee71SNavdeep Parhar 		snprintf(name, sizeof(name), "%s txq%d",
1236fe2ebb76SJohn Baldwin 		    device_get_nameunit(vi->dev), i);
1237f549e352SNavdeep Parhar 		init_eq(sc, &txq->eq, EQ_ETH, vi->qsize_txq, pi->tx_chan,
1238f549e352SNavdeep Parhar 		    sc->sge.rxq[iqidx].iq.cntxt_id, name);
123954e4ee71SNavdeep Parhar 
1240fe2ebb76SJohn Baldwin 		rc = alloc_txq(vi, txq, i, oid);
124154e4ee71SNavdeep Parhar 		if (rc != 0)
124254e4ee71SNavdeep Parhar 			goto done;
124354e4ee71SNavdeep Parhar 	}
1244eff62dbaSNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
1245fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, "ofld_txq",
1246eff62dbaSNavdeep Parhar 	    CTLFLAG_RD, NULL, "tx queues for TOE/ETHOFLD");
1247fe2ebb76SJohn Baldwin 	for_each_ofld_txq(vi, i, ofld_txq) {
1248298d969cSNavdeep Parhar 		struct sysctl_oid *oid2;
1249733b9277SNavdeep Parhar 
1250733b9277SNavdeep Parhar 		snprintf(name, sizeof(name), "%s ofld_txq%d",
1251fe2ebb76SJohn Baldwin 		    device_get_nameunit(vi->dev), i);
1252c3a88be4SNavdeep Parhar 		if (vi->nofldrxq > 0) {
1253eff62dbaSNavdeep Parhar 			iqidx = vi->first_ofld_rxq + (i % vi->nofldrxq);
1254c3a88be4SNavdeep Parhar 			init_eq(sc, &ofld_txq->eq, EQ_OFLD, vi->qsize_txq,
1255c3a88be4SNavdeep Parhar 			    pi->tx_chan, sc->sge.ofld_rxq[iqidx].iq.cntxt_id,
1256c3a88be4SNavdeep Parhar 			    name);
1257c3a88be4SNavdeep Parhar 		} else {
1258eff62dbaSNavdeep Parhar 			iqidx = vi->first_rxq + (i % vi->nrxq);
1259c3a88be4SNavdeep Parhar 			init_eq(sc, &ofld_txq->eq, EQ_OFLD, vi->qsize_txq,
1260c3a88be4SNavdeep Parhar 			    pi->tx_chan, sc->sge.rxq[iqidx].iq.cntxt_id, name);
1261c3a88be4SNavdeep Parhar 		}
1262733b9277SNavdeep Parhar 
1263733b9277SNavdeep Parhar 		snprintf(name, sizeof(name), "%d", i);
1264fe2ebb76SJohn Baldwin 		oid2 = SYSCTL_ADD_NODE(&vi->ctx, SYSCTL_CHILDREN(oid), OID_AUTO,
1265733b9277SNavdeep Parhar 		    name, CTLFLAG_RD, NULL, "offload tx queue");
1266733b9277SNavdeep Parhar 
1267fe2ebb76SJohn Baldwin 		rc = alloc_wrq(sc, vi, ofld_txq, oid2);
1268298d969cSNavdeep Parhar 		if (rc != 0)
1269298d969cSNavdeep Parhar 			goto done;
1270298d969cSNavdeep Parhar 	}
1271298d969cSNavdeep Parhar #endif
127254e4ee71SNavdeep Parhar done:
127354e4ee71SNavdeep Parhar 	if (rc)
1274fe2ebb76SJohn Baldwin 		t4_teardown_vi_queues(vi);
127554e4ee71SNavdeep Parhar 
127654e4ee71SNavdeep Parhar 	return (rc);
127754e4ee71SNavdeep Parhar }
127854e4ee71SNavdeep Parhar 
127954e4ee71SNavdeep Parhar /*
128054e4ee71SNavdeep Parhar  * Idempotent
128154e4ee71SNavdeep Parhar  */
128254e4ee71SNavdeep Parhar int
1283fe2ebb76SJohn Baldwin t4_teardown_vi_queues(struct vi_info *vi)
128454e4ee71SNavdeep Parhar {
128554e4ee71SNavdeep Parhar 	int i;
128654e4ee71SNavdeep Parhar 	struct sge_rxq *rxq;
128754e4ee71SNavdeep Parhar 	struct sge_txq *txq;
128837310a98SNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
128937310a98SNavdeep Parhar 	struct port_info *pi = vi->pi;
129037310a98SNavdeep Parhar 	struct adapter *sc = pi->adapter;
129137310a98SNavdeep Parhar 	struct sge_wrq *ofld_txq;
129237310a98SNavdeep Parhar #endif
129309fe6320SNavdeep Parhar #ifdef TCP_OFFLOAD
1294733b9277SNavdeep Parhar 	struct sge_ofld_rxq *ofld_rxq;
1295eff62dbaSNavdeep Parhar #endif
1296298d969cSNavdeep Parhar #ifdef DEV_NETMAP
1297298d969cSNavdeep Parhar 	struct sge_nm_rxq *nm_rxq;
1298298d969cSNavdeep Parhar 	struct sge_nm_txq *nm_txq;
1299298d969cSNavdeep Parhar #endif
130054e4ee71SNavdeep Parhar 
130154e4ee71SNavdeep Parhar 	/* Do this before freeing the queues */
1302fe2ebb76SJohn Baldwin 	if (vi->flags & VI_SYSCTL_CTX) {
1303fe2ebb76SJohn Baldwin 		sysctl_ctx_free(&vi->ctx);
1304fe2ebb76SJohn Baldwin 		vi->flags &= ~VI_SYSCTL_CTX;
130554e4ee71SNavdeep Parhar 	}
130654e4ee71SNavdeep Parhar 
1307fe2ebb76SJohn Baldwin #ifdef DEV_NETMAP
130862291463SNavdeep Parhar 	if (vi->ifp->if_capabilities & IFCAP_NETMAP) {
1309fe2ebb76SJohn Baldwin 		for_each_nm_txq(vi, i, nm_txq) {
1310fe2ebb76SJohn Baldwin 			free_nm_txq(vi, nm_txq);
1311fe2ebb76SJohn Baldwin 		}
1312fe2ebb76SJohn Baldwin 
1313fe2ebb76SJohn Baldwin 		for_each_nm_rxq(vi, i, nm_rxq) {
1314fe2ebb76SJohn Baldwin 			free_nm_rxq(vi, nm_rxq);
1315fe2ebb76SJohn Baldwin 		}
1316fe2ebb76SJohn Baldwin 	}
1317fe2ebb76SJohn Baldwin #endif
1318fe2ebb76SJohn Baldwin 
1319733b9277SNavdeep Parhar 	/*
1320733b9277SNavdeep Parhar 	 * Take down all the tx queues first, as they reference the rx queues
1321733b9277SNavdeep Parhar 	 * (for egress updates, etc.).
1322733b9277SNavdeep Parhar 	 */
1323733b9277SNavdeep Parhar 
1324fe2ebb76SJohn Baldwin 	for_each_txq(vi, i, txq) {
1325fe2ebb76SJohn Baldwin 		free_txq(vi, txq);
132654e4ee71SNavdeep Parhar 	}
1327eff62dbaSNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
1328fe2ebb76SJohn Baldwin 	for_each_ofld_txq(vi, i, ofld_txq) {
1329733b9277SNavdeep Parhar 		free_wrq(sc, ofld_txq);
1330733b9277SNavdeep Parhar 	}
1331733b9277SNavdeep Parhar #endif
1332733b9277SNavdeep Parhar 
1333733b9277SNavdeep Parhar 	/*
1334f549e352SNavdeep Parhar 	 * Then take down the rx queues.
1335733b9277SNavdeep Parhar 	 */
1336733b9277SNavdeep Parhar 
1337fe2ebb76SJohn Baldwin 	for_each_rxq(vi, i, rxq) {
1338fe2ebb76SJohn Baldwin 		free_rxq(vi, rxq);
133954e4ee71SNavdeep Parhar 	}
134009fe6320SNavdeep Parhar #ifdef TCP_OFFLOAD
1341fe2ebb76SJohn Baldwin 	for_each_ofld_rxq(vi, i, ofld_rxq) {
1342fe2ebb76SJohn Baldwin 		free_ofld_rxq(vi, ofld_rxq);
1343733b9277SNavdeep Parhar 	}
1344733b9277SNavdeep Parhar #endif
1345733b9277SNavdeep Parhar 
134654e4ee71SNavdeep Parhar 	return (0);
134754e4ee71SNavdeep Parhar }
134854e4ee71SNavdeep Parhar 
1349733b9277SNavdeep Parhar /*
13503098bcfcSNavdeep Parhar  * Interrupt handler when the driver is using only 1 interrupt.  This is a very
13513098bcfcSNavdeep Parhar  * unusual scenario.
13523098bcfcSNavdeep Parhar  *
13533098bcfcSNavdeep Parhar  * a) Deals with errors, if any.
13543098bcfcSNavdeep Parhar  * b) Services firmware event queue, which is taking interrupts for all other
13553098bcfcSNavdeep Parhar  *    queues.
1356733b9277SNavdeep Parhar  */
135754e4ee71SNavdeep Parhar void
135854e4ee71SNavdeep Parhar t4_intr_all(void *arg)
135954e4ee71SNavdeep Parhar {
136054e4ee71SNavdeep Parhar 	struct adapter *sc = arg;
1361733b9277SNavdeep Parhar 	struct sge_iq *fwq = &sc->sge.fwq;
136254e4ee71SNavdeep Parhar 
13633098bcfcSNavdeep Parhar 	MPASS(sc->intr_count == 1);
13643098bcfcSNavdeep Parhar 
136554e4ee71SNavdeep Parhar 	t4_intr_err(arg);
13663098bcfcSNavdeep Parhar 	t4_intr_evt(fwq);
136754e4ee71SNavdeep Parhar }
136854e4ee71SNavdeep Parhar 
13693098bcfcSNavdeep Parhar /*
13703098bcfcSNavdeep Parhar  * Interrupt handler for errors (installed directly when multiple interrupts are
13713098bcfcSNavdeep Parhar  * being used, or called by t4_intr_all).
13723098bcfcSNavdeep Parhar  */
137354e4ee71SNavdeep Parhar void
137454e4ee71SNavdeep Parhar t4_intr_err(void *arg)
137554e4ee71SNavdeep Parhar {
137654e4ee71SNavdeep Parhar 	struct adapter *sc = arg;
137754e4ee71SNavdeep Parhar 
137854e4ee71SNavdeep Parhar 	t4_write_reg(sc, MYPF_REG(A_PCIE_PF_CLI), 0);
137954e4ee71SNavdeep Parhar 	t4_slow_intr_handler(sc);
138054e4ee71SNavdeep Parhar }
138154e4ee71SNavdeep Parhar 
13823098bcfcSNavdeep Parhar /*
13833098bcfcSNavdeep Parhar  * Interrupt handler for iq-only queues.  The firmware event queue is the only
13843098bcfcSNavdeep Parhar  * such queue right now.
13853098bcfcSNavdeep Parhar  */
138654e4ee71SNavdeep Parhar void
138754e4ee71SNavdeep Parhar t4_intr_evt(void *arg)
138854e4ee71SNavdeep Parhar {
138954e4ee71SNavdeep Parhar 	struct sge_iq *iq = arg;
13902be67d29SNavdeep Parhar 
1391733b9277SNavdeep Parhar 	if (atomic_cmpset_int(&iq->state, IQS_IDLE, IQS_BUSY)) {
1392733b9277SNavdeep Parhar 		service_iq(iq, 0);
1393da6e3387SNavdeep Parhar 		(void) atomic_cmpset_int(&iq->state, IQS_BUSY, IQS_IDLE);
13942be67d29SNavdeep Parhar 	}
13952be67d29SNavdeep Parhar }
13962be67d29SNavdeep Parhar 
13973098bcfcSNavdeep Parhar /*
13983098bcfcSNavdeep Parhar  * Interrupt handler for iq+fl queues.
13993098bcfcSNavdeep Parhar  */
1400733b9277SNavdeep Parhar void
1401733b9277SNavdeep Parhar t4_intr(void *arg)
14022be67d29SNavdeep Parhar {
14032be67d29SNavdeep Parhar 	struct sge_iq *iq = arg;
1404733b9277SNavdeep Parhar 
1405733b9277SNavdeep Parhar 	if (atomic_cmpset_int(&iq->state, IQS_IDLE, IQS_BUSY)) {
14063098bcfcSNavdeep Parhar 		service_iq_fl(iq, 0);
1407da6e3387SNavdeep Parhar 		(void) atomic_cmpset_int(&iq->state, IQS_BUSY, IQS_IDLE);
1408733b9277SNavdeep Parhar 	}
1409733b9277SNavdeep Parhar }
1410733b9277SNavdeep Parhar 
14113098bcfcSNavdeep Parhar #ifdef DEV_NETMAP
14123098bcfcSNavdeep Parhar /*
14133098bcfcSNavdeep Parhar  * Interrupt handler for netmap rx queues.
14143098bcfcSNavdeep Parhar  */
14153098bcfcSNavdeep Parhar void
14163098bcfcSNavdeep Parhar t4_nm_intr(void *arg)
14173098bcfcSNavdeep Parhar {
14183098bcfcSNavdeep Parhar 	struct sge_nm_rxq *nm_rxq = arg;
14193098bcfcSNavdeep Parhar 
14203098bcfcSNavdeep Parhar 	if (atomic_cmpset_int(&nm_rxq->nm_state, NM_ON, NM_BUSY)) {
14213098bcfcSNavdeep Parhar 		service_nm_rxq(nm_rxq);
1422da6e3387SNavdeep Parhar 		(void) atomic_cmpset_int(&nm_rxq->nm_state, NM_BUSY, NM_ON);
14233098bcfcSNavdeep Parhar 	}
14243098bcfcSNavdeep Parhar }
14253098bcfcSNavdeep Parhar 
14263098bcfcSNavdeep Parhar /*
14273098bcfcSNavdeep Parhar  * Interrupt handler for vectors shared between NIC and netmap rx queues.
14283098bcfcSNavdeep Parhar  */
142962291463SNavdeep Parhar void
143062291463SNavdeep Parhar t4_vi_intr(void *arg)
143162291463SNavdeep Parhar {
143262291463SNavdeep Parhar 	struct irq *irq = arg;
143362291463SNavdeep Parhar 
14343098bcfcSNavdeep Parhar 	MPASS(irq->nm_rxq != NULL);
143562291463SNavdeep Parhar 	t4_nm_intr(irq->nm_rxq);
14363098bcfcSNavdeep Parhar 
14373098bcfcSNavdeep Parhar 	MPASS(irq->rxq != NULL);
143862291463SNavdeep Parhar 	t4_intr(irq->rxq);
143962291463SNavdeep Parhar }
14403098bcfcSNavdeep Parhar #endif
144146f48ee5SNavdeep Parhar 
1442733b9277SNavdeep Parhar /*
14433098bcfcSNavdeep Parhar  * Deals with interrupts on an iq-only (no freelist) queue.
1444733b9277SNavdeep Parhar  */
1445733b9277SNavdeep Parhar static int
1446733b9277SNavdeep Parhar service_iq(struct sge_iq *iq, int budget)
1447733b9277SNavdeep Parhar {
1448733b9277SNavdeep Parhar 	struct sge_iq *q;
144954e4ee71SNavdeep Parhar 	struct adapter *sc = iq->adapter;
1450b2daa9a9SNavdeep Parhar 	struct iq_desc *d = &iq->desc[iq->cidx];
14514d6db4e0SNavdeep Parhar 	int ndescs = 0, limit;
14523098bcfcSNavdeep Parhar 	int rsp_type;
1453733b9277SNavdeep Parhar 	uint32_t lq;
1454733b9277SNavdeep Parhar 	STAILQ_HEAD(, sge_iq) iql = STAILQ_HEAD_INITIALIZER(iql);
1455733b9277SNavdeep Parhar 
1456733b9277SNavdeep Parhar 	KASSERT(iq->state == IQS_BUSY, ("%s: iq %p not BUSY", __func__, iq));
14573098bcfcSNavdeep Parhar 	KASSERT((iq->flags & IQ_HAS_FL) == 0,
14583098bcfcSNavdeep Parhar 	    ("%s: called for iq %p with fl (iq->flags 0x%x)", __func__, iq,
14593098bcfcSNavdeep Parhar 	    iq->flags));
14603098bcfcSNavdeep Parhar 	MPASS((iq->flags & IQ_ADJ_CREDIT) == 0);
14613098bcfcSNavdeep Parhar 	MPASS((iq->flags & IQ_LRO_ENABLED) == 0);
1462733b9277SNavdeep Parhar 
14634d6db4e0SNavdeep Parhar 	limit = budget ? budget : iq->qsize / 16;
14644d6db4e0SNavdeep Parhar 
1465733b9277SNavdeep Parhar 	/*
1466733b9277SNavdeep Parhar 	 * We always come back and check the descriptor ring for new indirect
1467733b9277SNavdeep Parhar 	 * interrupts and other responses after running a single handler.
1468733b9277SNavdeep Parhar 	 */
1469733b9277SNavdeep Parhar 	for (;;) {
1470b2daa9a9SNavdeep Parhar 		while ((d->rsp.u.type_gen & F_RSPD_GEN) == iq->gen) {
147154e4ee71SNavdeep Parhar 
147254e4ee71SNavdeep Parhar 			rmb();
147354e4ee71SNavdeep Parhar 
1474b2daa9a9SNavdeep Parhar 			rsp_type = G_RSPD_TYPE(d->rsp.u.type_gen);
1475b2daa9a9SNavdeep Parhar 			lq = be32toh(d->rsp.pldbuflen_qid);
147654e4ee71SNavdeep Parhar 
1477733b9277SNavdeep Parhar 			switch (rsp_type) {
1478733b9277SNavdeep Parhar 			case X_RSPD_TYPE_FLBUF:
14793098bcfcSNavdeep Parhar 				panic("%s: data for an iq (%p) with no freelist",
14803098bcfcSNavdeep Parhar 				    __func__, iq);
148154e4ee71SNavdeep Parhar 
14823098bcfcSNavdeep Parhar 				/* NOTREACHED */
1483733b9277SNavdeep Parhar 
1484733b9277SNavdeep Parhar 			case X_RSPD_TYPE_CPL:
1485b2daa9a9SNavdeep Parhar 				KASSERT(d->rss.opcode < NUM_CPL_CMDS,
1486733b9277SNavdeep Parhar 				    ("%s: bad opcode %02x.", __func__,
1487b2daa9a9SNavdeep Parhar 				    d->rss.opcode));
14883098bcfcSNavdeep Parhar 				t4_cpl_handler[d->rss.opcode](iq, &d->rss, NULL);
1489733b9277SNavdeep Parhar 				break;
1490733b9277SNavdeep Parhar 
1491733b9277SNavdeep Parhar 			case X_RSPD_TYPE_INTR:
149298005176SNavdeep Parhar 				/*
149398005176SNavdeep Parhar 				 * There are 1K interrupt-capable queues (qids 0
149498005176SNavdeep Parhar 				 * through 1023).  A response type indicating a
149598005176SNavdeep Parhar 				 * forwarded interrupt with a qid >= 1K is an
149698005176SNavdeep Parhar 				 * iWARP async notification.
149798005176SNavdeep Parhar 				 */
14983098bcfcSNavdeep Parhar 				if (__predict_true(lq >= 1024)) {
1499671bf2b8SNavdeep Parhar 					t4_an_handler(iq, &d->rsp);
150098005176SNavdeep Parhar 					break;
150198005176SNavdeep Parhar 				}
150298005176SNavdeep Parhar 
1503ec55567cSJohn Baldwin 				q = sc->sge.iqmap[lq - sc->sge.iq_start -
1504ec55567cSJohn Baldwin 				    sc->sge.iq_base];
1505733b9277SNavdeep Parhar 				if (atomic_cmpset_int(&q->state, IQS_IDLE,
1506733b9277SNavdeep Parhar 				    IQS_BUSY)) {
15073098bcfcSNavdeep Parhar 					if (service_iq_fl(q, q->qsize / 16) == 0) {
1508da6e3387SNavdeep Parhar 						(void) atomic_cmpset_int(&q->state,
1509733b9277SNavdeep Parhar 						    IQS_BUSY, IQS_IDLE);
1510733b9277SNavdeep Parhar 					} else {
1511733b9277SNavdeep Parhar 						STAILQ_INSERT_TAIL(&iql, q,
1512733b9277SNavdeep Parhar 						    link);
1513733b9277SNavdeep Parhar 					}
1514733b9277SNavdeep Parhar 				}
1515733b9277SNavdeep Parhar 				break;
1516733b9277SNavdeep Parhar 
1517733b9277SNavdeep Parhar 			default:
151898005176SNavdeep Parhar 				KASSERT(0,
151998005176SNavdeep Parhar 				    ("%s: illegal response type %d on iq %p",
152098005176SNavdeep Parhar 				    __func__, rsp_type, iq));
152198005176SNavdeep Parhar 				log(LOG_ERR,
152298005176SNavdeep Parhar 				    "%s: illegal response type %d on iq %p",
152398005176SNavdeep Parhar 				    device_get_nameunit(sc->dev), rsp_type, iq);
152409fe6320SNavdeep Parhar 				break;
152554e4ee71SNavdeep Parhar 			}
152656599263SNavdeep Parhar 
1527b2daa9a9SNavdeep Parhar 			d++;
1528b2daa9a9SNavdeep Parhar 			if (__predict_false(++iq->cidx == iq->sidx)) {
1529b2daa9a9SNavdeep Parhar 				iq->cidx = 0;
1530b2daa9a9SNavdeep Parhar 				iq->gen ^= F_RSPD_GEN;
1531b2daa9a9SNavdeep Parhar 				d = &iq->desc[0];
1532b2daa9a9SNavdeep Parhar 			}
1533b2daa9a9SNavdeep Parhar 			if (__predict_false(++ndescs == limit)) {
1534315048f2SJohn Baldwin 				t4_write_reg(sc, sc->sge_gts_reg,
1535733b9277SNavdeep Parhar 				    V_CIDXINC(ndescs) |
1536733b9277SNavdeep Parhar 				    V_INGRESSQID(iq->cntxt_id) |
1537733b9277SNavdeep Parhar 				    V_SEINTARM(V_QINTR_TIMER_IDX(X_TIMERREG_UPDATE_CIDX)));
1538733b9277SNavdeep Parhar 				ndescs = 0;
1539733b9277SNavdeep Parhar 
15403098bcfcSNavdeep Parhar 				if (budget) {
15413098bcfcSNavdeep Parhar 					return (EINPROGRESS);
15423098bcfcSNavdeep Parhar 				}
15433098bcfcSNavdeep Parhar 			}
15443098bcfcSNavdeep Parhar 		}
15453098bcfcSNavdeep Parhar 
15463098bcfcSNavdeep Parhar 		if (STAILQ_EMPTY(&iql))
15473098bcfcSNavdeep Parhar 			break;
15483098bcfcSNavdeep Parhar 
15493098bcfcSNavdeep Parhar 		/*
15503098bcfcSNavdeep Parhar 		 * Process the head only, and send it to the back of the list if
15513098bcfcSNavdeep Parhar 		 * it's still not done.
15523098bcfcSNavdeep Parhar 		 */
15533098bcfcSNavdeep Parhar 		q = STAILQ_FIRST(&iql);
15543098bcfcSNavdeep Parhar 		STAILQ_REMOVE_HEAD(&iql, link);
15553098bcfcSNavdeep Parhar 		if (service_iq_fl(q, q->qsize / 8) == 0)
1556da6e3387SNavdeep Parhar 			(void) atomic_cmpset_int(&q->state, IQS_BUSY, IQS_IDLE);
15573098bcfcSNavdeep Parhar 		else
15583098bcfcSNavdeep Parhar 			STAILQ_INSERT_TAIL(&iql, q, link);
15593098bcfcSNavdeep Parhar 	}
15603098bcfcSNavdeep Parhar 
15613098bcfcSNavdeep Parhar 	t4_write_reg(sc, sc->sge_gts_reg, V_CIDXINC(ndescs) |
15623098bcfcSNavdeep Parhar 	    V_INGRESSQID((u32)iq->cntxt_id) | V_SEINTARM(iq->intr_params));
15633098bcfcSNavdeep Parhar 
15643098bcfcSNavdeep Parhar 	return (0);
15653098bcfcSNavdeep Parhar }
15663098bcfcSNavdeep Parhar 
15673098bcfcSNavdeep Parhar static inline int
15683098bcfcSNavdeep Parhar sort_before_lro(struct lro_ctrl *lro)
15693098bcfcSNavdeep Parhar {
15703098bcfcSNavdeep Parhar 
15713098bcfcSNavdeep Parhar 	return (lro->lro_mbuf_max != 0);
15723098bcfcSNavdeep Parhar }
15733098bcfcSNavdeep Parhar 
1574e7e08444SNavdeep Parhar static inline uint64_t
1575e7e08444SNavdeep Parhar last_flit_to_ns(struct adapter *sc, uint64_t lf)
1576e7e08444SNavdeep Parhar {
1577e7e08444SNavdeep Parhar 	uint64_t n = be64toh(lf) & 0xfffffffffffffff;	/* 60b, not 64b. */
1578e7e08444SNavdeep Parhar 
1579e7e08444SNavdeep Parhar 	if (n > UINT64_MAX / 1000000)
1580e7e08444SNavdeep Parhar 		return (n / sc->params.vpd.cclk * 1000000);
1581e7e08444SNavdeep Parhar 	else
1582e7e08444SNavdeep Parhar 		return (n * 1000000 / sc->params.vpd.cclk);
1583e7e08444SNavdeep Parhar }
1584e7e08444SNavdeep Parhar 
15853098bcfcSNavdeep Parhar /*
15863098bcfcSNavdeep Parhar  * Deals with interrupts on an iq+fl queue.
15873098bcfcSNavdeep Parhar  */
15883098bcfcSNavdeep Parhar static int
15893098bcfcSNavdeep Parhar service_iq_fl(struct sge_iq *iq, int budget)
15903098bcfcSNavdeep Parhar {
15913098bcfcSNavdeep Parhar 	struct sge_rxq *rxq = iq_to_rxq(iq);
15923098bcfcSNavdeep Parhar 	struct sge_fl *fl;
15933098bcfcSNavdeep Parhar 	struct adapter *sc = iq->adapter;
15943098bcfcSNavdeep Parhar 	struct iq_desc *d = &iq->desc[iq->cidx];
15953098bcfcSNavdeep Parhar 	int ndescs = 0, limit;
15963098bcfcSNavdeep Parhar 	int rsp_type, refill, starved;
15973098bcfcSNavdeep Parhar 	uint32_t lq;
15983098bcfcSNavdeep Parhar 	uint16_t fl_hw_cidx;
15993098bcfcSNavdeep Parhar 	struct mbuf *m0;
16003098bcfcSNavdeep Parhar #if defined(INET) || defined(INET6)
16013098bcfcSNavdeep Parhar 	const struct timeval lro_timeout = {0, sc->lro_timeout};
16023098bcfcSNavdeep Parhar 	struct lro_ctrl *lro = &rxq->lro;
16033098bcfcSNavdeep Parhar #endif
16043098bcfcSNavdeep Parhar 
16053098bcfcSNavdeep Parhar 	KASSERT(iq->state == IQS_BUSY, ("%s: iq %p not BUSY", __func__, iq));
16063098bcfcSNavdeep Parhar 	MPASS(iq->flags & IQ_HAS_FL);
16073098bcfcSNavdeep Parhar 
16083098bcfcSNavdeep Parhar 	limit = budget ? budget : iq->qsize / 16;
16093098bcfcSNavdeep Parhar 	fl = &rxq->fl;
16103098bcfcSNavdeep Parhar 	fl_hw_cidx = fl->hw_cidx;	/* stable snapshot */
16113098bcfcSNavdeep Parhar 
16123098bcfcSNavdeep Parhar #if defined(INET) || defined(INET6)
16133098bcfcSNavdeep Parhar 	if (iq->flags & IQ_ADJ_CREDIT) {
16143098bcfcSNavdeep Parhar 		MPASS(sort_before_lro(lro));
16153098bcfcSNavdeep Parhar 		iq->flags &= ~IQ_ADJ_CREDIT;
16163098bcfcSNavdeep Parhar 		if ((d->rsp.u.type_gen & F_RSPD_GEN) != iq->gen) {
16173098bcfcSNavdeep Parhar 			tcp_lro_flush_all(lro);
16183098bcfcSNavdeep Parhar 			t4_write_reg(sc, sc->sge_gts_reg, V_CIDXINC(1) |
16193098bcfcSNavdeep Parhar 			    V_INGRESSQID((u32)iq->cntxt_id) |
16203098bcfcSNavdeep Parhar 			    V_SEINTARM(iq->intr_params));
16213098bcfcSNavdeep Parhar 			return (0);
16223098bcfcSNavdeep Parhar 		}
16233098bcfcSNavdeep Parhar 		ndescs = 1;
16243098bcfcSNavdeep Parhar 	}
16253098bcfcSNavdeep Parhar #else
16263098bcfcSNavdeep Parhar 	MPASS((iq->flags & IQ_ADJ_CREDIT) == 0);
16273098bcfcSNavdeep Parhar #endif
16283098bcfcSNavdeep Parhar 
16293098bcfcSNavdeep Parhar 	while ((d->rsp.u.type_gen & F_RSPD_GEN) == iq->gen) {
16303098bcfcSNavdeep Parhar 
16313098bcfcSNavdeep Parhar 		rmb();
16323098bcfcSNavdeep Parhar 
16333098bcfcSNavdeep Parhar 		refill = 0;
16343098bcfcSNavdeep Parhar 		m0 = NULL;
16353098bcfcSNavdeep Parhar 		rsp_type = G_RSPD_TYPE(d->rsp.u.type_gen);
16363098bcfcSNavdeep Parhar 		lq = be32toh(d->rsp.pldbuflen_qid);
16373098bcfcSNavdeep Parhar 
16383098bcfcSNavdeep Parhar 		switch (rsp_type) {
16393098bcfcSNavdeep Parhar 		case X_RSPD_TYPE_FLBUF:
16403098bcfcSNavdeep Parhar 
16413098bcfcSNavdeep Parhar 			m0 = get_fl_payload(sc, fl, lq);
16423098bcfcSNavdeep Parhar 			if (__predict_false(m0 == NULL))
16433098bcfcSNavdeep Parhar 				goto out;
16443098bcfcSNavdeep Parhar 			refill = IDXDIFF(fl->hw_cidx, fl_hw_cidx, fl->sidx) > 2;
1645e7e08444SNavdeep Parhar 
1646e7e08444SNavdeep Parhar 			if (iq->flags & IQ_RX_TIMESTAMP) {
16473098bcfcSNavdeep Parhar 				/*
1648e7e08444SNavdeep Parhar 				 * Fill up rcv_tstmp but do not set M_TSTMP.
1649e7e08444SNavdeep Parhar 				 * rcv_tstmp is not in the format that the
1650e7e08444SNavdeep Parhar 				 * kernel expects and we don't want to mislead
1651e7e08444SNavdeep Parhar 				 * it.  For now this is only for custom code
1652e7e08444SNavdeep Parhar 				 * that knows how to interpret cxgbe's stamp.
16533098bcfcSNavdeep Parhar 				 */
1654e7e08444SNavdeep Parhar 				m0->m_pkthdr.rcv_tstmp =
1655e7e08444SNavdeep Parhar 				    last_flit_to_ns(sc, d->rsp.u.last_flit);
1656e7e08444SNavdeep Parhar #ifdef notyet
1657e7e08444SNavdeep Parhar 				m0->m_flags |= M_TSTMP;
16583098bcfcSNavdeep Parhar #endif
1659e7e08444SNavdeep Parhar 			}
16603098bcfcSNavdeep Parhar 
16613098bcfcSNavdeep Parhar 			/* fall through */
16623098bcfcSNavdeep Parhar 
16633098bcfcSNavdeep Parhar 		case X_RSPD_TYPE_CPL:
16643098bcfcSNavdeep Parhar 			KASSERT(d->rss.opcode < NUM_CPL_CMDS,
16653098bcfcSNavdeep Parhar 			    ("%s: bad opcode %02x.", __func__, d->rss.opcode));
16663098bcfcSNavdeep Parhar 			t4_cpl_handler[d->rss.opcode](iq, &d->rss, m0);
16673098bcfcSNavdeep Parhar 			break;
16683098bcfcSNavdeep Parhar 
16693098bcfcSNavdeep Parhar 		case X_RSPD_TYPE_INTR:
16703098bcfcSNavdeep Parhar 
16713098bcfcSNavdeep Parhar 			/*
16723098bcfcSNavdeep Parhar 			 * There are 1K interrupt-capable queues (qids 0
16733098bcfcSNavdeep Parhar 			 * through 1023).  A response type indicating a
16743098bcfcSNavdeep Parhar 			 * forwarded interrupt with a qid >= 1K is an
16753098bcfcSNavdeep Parhar 			 * iWARP async notification.  That is the only
16763098bcfcSNavdeep Parhar 			 * acceptable indirect interrupt on this queue.
16773098bcfcSNavdeep Parhar 			 */
16783098bcfcSNavdeep Parhar 			if (__predict_false(lq < 1024)) {
16793098bcfcSNavdeep Parhar 				panic("%s: indirect interrupt on iq_fl %p "
16803098bcfcSNavdeep Parhar 				    "with qid %u", __func__, iq, lq);
16813098bcfcSNavdeep Parhar 			}
16823098bcfcSNavdeep Parhar 
16833098bcfcSNavdeep Parhar 			t4_an_handler(iq, &d->rsp);
16843098bcfcSNavdeep Parhar 			break;
16853098bcfcSNavdeep Parhar 
16863098bcfcSNavdeep Parhar 		default:
16873098bcfcSNavdeep Parhar 			KASSERT(0, ("%s: illegal response type %d on iq %p",
16883098bcfcSNavdeep Parhar 			    __func__, rsp_type, iq));
16893098bcfcSNavdeep Parhar 			log(LOG_ERR, "%s: illegal response type %d on iq %p",
16903098bcfcSNavdeep Parhar 			    device_get_nameunit(sc->dev), rsp_type, iq);
16913098bcfcSNavdeep Parhar 			break;
16923098bcfcSNavdeep Parhar 		}
16933098bcfcSNavdeep Parhar 
16943098bcfcSNavdeep Parhar 		d++;
16953098bcfcSNavdeep Parhar 		if (__predict_false(++iq->cidx == iq->sidx)) {
16963098bcfcSNavdeep Parhar 			iq->cidx = 0;
16973098bcfcSNavdeep Parhar 			iq->gen ^= F_RSPD_GEN;
16983098bcfcSNavdeep Parhar 			d = &iq->desc[0];
16993098bcfcSNavdeep Parhar 		}
17003098bcfcSNavdeep Parhar 		if (__predict_false(++ndescs == limit)) {
17013098bcfcSNavdeep Parhar 			t4_write_reg(sc, sc->sge_gts_reg, V_CIDXINC(ndescs) |
17023098bcfcSNavdeep Parhar 			    V_INGRESSQID(iq->cntxt_id) |
17033098bcfcSNavdeep Parhar 			    V_SEINTARM(V_QINTR_TIMER_IDX(X_TIMERREG_UPDATE_CIDX)));
17043098bcfcSNavdeep Parhar 			ndescs = 0;
17053098bcfcSNavdeep Parhar 
1706480e603cSNavdeep Parhar #if defined(INET) || defined(INET6)
1707480e603cSNavdeep Parhar 			if (iq->flags & IQ_LRO_ENABLED &&
170846f48ee5SNavdeep Parhar 			    !sort_before_lro(lro) &&
1709480e603cSNavdeep Parhar 			    sc->lro_timeout != 0) {
17103098bcfcSNavdeep Parhar 				tcp_lro_flush_inactive(lro, &lro_timeout);
1711480e603cSNavdeep Parhar 			}
1712480e603cSNavdeep Parhar #endif
1713861e42b2SNavdeep Parhar 			if (budget) {
1714861e42b2SNavdeep Parhar 				FL_LOCK(fl);
1715861e42b2SNavdeep Parhar 				refill_fl(sc, fl, 32);
1716861e42b2SNavdeep Parhar 				FL_UNLOCK(fl);
17173098bcfcSNavdeep Parhar 
1718733b9277SNavdeep Parhar 				return (EINPROGRESS);
171954e4ee71SNavdeep Parhar 			}
1720733b9277SNavdeep Parhar 		}
17214d6db4e0SNavdeep Parhar 		if (refill) {
17224d6db4e0SNavdeep Parhar 			FL_LOCK(fl);
17234d6db4e0SNavdeep Parhar 			refill_fl(sc, fl, 32);
17244d6db4e0SNavdeep Parhar 			FL_UNLOCK(fl);
17254d6db4e0SNavdeep Parhar 			fl_hw_cidx = fl->hw_cidx;
17264d6db4e0SNavdeep Parhar 		}
1727861e42b2SNavdeep Parhar 	}
17283098bcfcSNavdeep Parhar out:
1729a1ea9a82SNavdeep Parhar #if defined(INET) || defined(INET6)
1730733b9277SNavdeep Parhar 	if (iq->flags & IQ_LRO_ENABLED) {
173146f48ee5SNavdeep Parhar 		if (ndescs > 0 && lro->lro_mbuf_count > 8) {
173246f48ee5SNavdeep Parhar 			MPASS(sort_before_lro(lro));
173346f48ee5SNavdeep Parhar 			/* hold back one credit and don't flush LRO state */
173446f48ee5SNavdeep Parhar 			iq->flags |= IQ_ADJ_CREDIT;
173546f48ee5SNavdeep Parhar 			ndescs--;
173646f48ee5SNavdeep Parhar 		} else {
17376dd38b87SSepherosa Ziehau 			tcp_lro_flush_all(lro);
1738733b9277SNavdeep Parhar 		}
173946f48ee5SNavdeep Parhar 	}
1740733b9277SNavdeep Parhar #endif
1741733b9277SNavdeep Parhar 
1742315048f2SJohn Baldwin 	t4_write_reg(sc, sc->sge_gts_reg, V_CIDXINC(ndescs) |
1743733b9277SNavdeep Parhar 	    V_INGRESSQID((u32)iq->cntxt_id) | V_SEINTARM(iq->intr_params));
1744733b9277SNavdeep Parhar 
1745733b9277SNavdeep Parhar 	FL_LOCK(fl);
174638035ed6SNavdeep Parhar 	starved = refill_fl(sc, fl, 64);
1747733b9277SNavdeep Parhar 	FL_UNLOCK(fl);
1748733b9277SNavdeep Parhar 	if (__predict_false(starved != 0))
1749733b9277SNavdeep Parhar 		add_fl_to_sfl(sc, fl);
1750733b9277SNavdeep Parhar 
1751733b9277SNavdeep Parhar 	return (0);
1752733b9277SNavdeep Parhar }
1753733b9277SNavdeep Parhar 
175438035ed6SNavdeep Parhar static inline int
175538035ed6SNavdeep Parhar cl_has_metadata(struct sge_fl *fl, struct cluster_layout *cll)
17561458bff9SNavdeep Parhar {
175738035ed6SNavdeep Parhar 	int rc = fl->flags & FL_BUF_PACKING || cll->region1 > 0;
17581458bff9SNavdeep Parhar 
175938035ed6SNavdeep Parhar 	if (rc)
176038035ed6SNavdeep Parhar 		MPASS(cll->region3 >= CL_METADATA_SIZE);
176138035ed6SNavdeep Parhar 
176238035ed6SNavdeep Parhar 	return (rc);
17631458bff9SNavdeep Parhar }
17641458bff9SNavdeep Parhar 
176538035ed6SNavdeep Parhar static inline struct cluster_metadata *
176638035ed6SNavdeep Parhar cl_metadata(struct adapter *sc, struct sge_fl *fl, struct cluster_layout *cll,
176738035ed6SNavdeep Parhar     caddr_t cl)
17681458bff9SNavdeep Parhar {
17691458bff9SNavdeep Parhar 
177038035ed6SNavdeep Parhar 	if (cl_has_metadata(fl, cll)) {
177138035ed6SNavdeep Parhar 		struct sw_zone_info *swz = &sc->sge.sw_zone_info[cll->zidx];
17721458bff9SNavdeep Parhar 
177338035ed6SNavdeep Parhar 		return ((struct cluster_metadata *)(cl + swz->size) - 1);
17741458bff9SNavdeep Parhar 	}
177538035ed6SNavdeep Parhar 	return (NULL);
17761458bff9SNavdeep Parhar }
17771458bff9SNavdeep Parhar 
177815c28f87SGleb Smirnoff static void
1779e8fd18f3SGleb Smirnoff rxb_free(struct mbuf *m)
17801458bff9SNavdeep Parhar {
1781e8fd18f3SGleb Smirnoff 	uma_zone_t zone = m->m_ext.ext_arg1;
1782e8fd18f3SGleb Smirnoff 	void *cl = m->m_ext.ext_arg2;
17831458bff9SNavdeep Parhar 
17841458bff9SNavdeep Parhar 	uma_zfree(zone, cl);
178582eff304SNavdeep Parhar 	counter_u64_add(extfree_rels, 1);
17861458bff9SNavdeep Parhar }
17871458bff9SNavdeep Parhar 
178838035ed6SNavdeep Parhar /*
178938035ed6SNavdeep Parhar  * The mbuf returned by this function could be allocated from zone_mbuf or
179038035ed6SNavdeep Parhar  * constructed in spare room in the cluster.
179138035ed6SNavdeep Parhar  *
179238035ed6SNavdeep Parhar  * The mbuf carries the payload in one of these ways
179338035ed6SNavdeep Parhar  * a) frame inside the mbuf (mbuf from zone_mbuf)
179438035ed6SNavdeep Parhar  * b) m_cljset (for clusters without metadata) zone_mbuf
179538035ed6SNavdeep Parhar  * c) m_extaddref (cluster with metadata) inline mbuf
179638035ed6SNavdeep Parhar  * d) m_extaddref (cluster with metadata) zone_mbuf
179738035ed6SNavdeep Parhar  */
17981458bff9SNavdeep Parhar static struct mbuf *
1799b741402cSNavdeep Parhar get_scatter_segment(struct adapter *sc, struct sge_fl *fl, int fr_offset,
1800b741402cSNavdeep Parhar     int remaining)
180138035ed6SNavdeep Parhar {
180238035ed6SNavdeep Parhar 	struct mbuf *m;
180338035ed6SNavdeep Parhar 	struct fl_sdesc *sd = &fl->sdesc[fl->cidx];
180438035ed6SNavdeep Parhar 	struct cluster_layout *cll = &sd->cll;
180538035ed6SNavdeep Parhar 	struct sw_zone_info *swz = &sc->sge.sw_zone_info[cll->zidx];
180638035ed6SNavdeep Parhar 	struct hw_buf_info *hwb = &sc->sge.hw_buf_info[cll->hwidx];
180738035ed6SNavdeep Parhar 	struct cluster_metadata *clm = cl_metadata(sc, fl, cll, sd->cl);
1808b741402cSNavdeep Parhar 	int len, blen;
180938035ed6SNavdeep Parhar 	caddr_t payload;
181038035ed6SNavdeep Parhar 
1811b741402cSNavdeep Parhar 	blen = hwb->size - fl->rx_offset;	/* max possible in this buf */
1812b741402cSNavdeep Parhar 	len = min(remaining, blen);
181338035ed6SNavdeep Parhar 	payload = sd->cl + cll->region1 + fl->rx_offset;
1814e3207e19SNavdeep Parhar 	if (fl->flags & FL_BUF_PACKING) {
1815b741402cSNavdeep Parhar 		const u_int l = fr_offset + len;
1816b741402cSNavdeep Parhar 		const u_int pad = roundup2(l, fl->buf_boundary) - l;
1817b741402cSNavdeep Parhar 
1818b741402cSNavdeep Parhar 		if (fl->rx_offset + len + pad < hwb->size)
1819b741402cSNavdeep Parhar 			blen = len + pad;
1820b741402cSNavdeep Parhar 		MPASS(fl->rx_offset + blen <= hwb->size);
1821e3207e19SNavdeep Parhar 	} else {
1822e3207e19SNavdeep Parhar 		MPASS(fl->rx_offset == 0);	/* not packing */
1823e3207e19SNavdeep Parhar 	}
182438035ed6SNavdeep Parhar 
1825b741402cSNavdeep Parhar 
182638035ed6SNavdeep Parhar 	if (sc->sc_do_rxcopy && len < RX_COPY_THRESHOLD) {
182738035ed6SNavdeep Parhar 
182838035ed6SNavdeep Parhar 		/*
182938035ed6SNavdeep Parhar 		 * Copy payload into a freshly allocated mbuf.
183038035ed6SNavdeep Parhar 		 */
183138035ed6SNavdeep Parhar 
1832b741402cSNavdeep Parhar 		m = fr_offset == 0 ?
183338035ed6SNavdeep Parhar 		    m_gethdr(M_NOWAIT, MT_DATA) : m_get(M_NOWAIT, MT_DATA);
183438035ed6SNavdeep Parhar 		if (m == NULL)
183538035ed6SNavdeep Parhar 			return (NULL);
183638035ed6SNavdeep Parhar 		fl->mbuf_allocated++;
1837e7e08444SNavdeep Parhar 
183838035ed6SNavdeep Parhar 		/* copy data to mbuf */
183938035ed6SNavdeep Parhar 		bcopy(payload, mtod(m, caddr_t), len);
184038035ed6SNavdeep Parhar 
1841c3fb7725SNavdeep Parhar 	} else if (sd->nmbuf * MSIZE < cll->region1) {
184238035ed6SNavdeep Parhar 
184338035ed6SNavdeep Parhar 		/*
184438035ed6SNavdeep Parhar 		 * There's spare room in the cluster for an mbuf.  Create one
1845ccc69b2fSNavdeep Parhar 		 * and associate it with the payload that's in the cluster.
184638035ed6SNavdeep Parhar 		 */
184738035ed6SNavdeep Parhar 
184838035ed6SNavdeep Parhar 		MPASS(clm != NULL);
1849c3fb7725SNavdeep Parhar 		m = (struct mbuf *)(sd->cl + sd->nmbuf * MSIZE);
185038035ed6SNavdeep Parhar 		/* No bzero required */
1851b4b12e52SGleb Smirnoff 		if (m_init(m, M_NOWAIT, MT_DATA,
1852b741402cSNavdeep Parhar 		    fr_offset == 0 ? M_PKTHDR | M_NOFREE : M_NOFREE))
185338035ed6SNavdeep Parhar 			return (NULL);
185438035ed6SNavdeep Parhar 		fl->mbuf_inlined++;
1855b741402cSNavdeep Parhar 		m_extaddref(m, payload, blen, &clm->refcount, rxb_free,
185638035ed6SNavdeep Parhar 		    swz->zone, sd->cl);
185782eff304SNavdeep Parhar 		if (sd->nmbuf++ == 0)
185882eff304SNavdeep Parhar 			counter_u64_add(extfree_refs, 1);
185938035ed6SNavdeep Parhar 
186038035ed6SNavdeep Parhar 	} else {
186138035ed6SNavdeep Parhar 
186238035ed6SNavdeep Parhar 		/*
186338035ed6SNavdeep Parhar 		 * Grab an mbuf from zone_mbuf and associate it with the
186438035ed6SNavdeep Parhar 		 * payload in the cluster.
186538035ed6SNavdeep Parhar 		 */
186638035ed6SNavdeep Parhar 
1867b741402cSNavdeep Parhar 		m = fr_offset == 0 ?
186838035ed6SNavdeep Parhar 		    m_gethdr(M_NOWAIT, MT_DATA) : m_get(M_NOWAIT, MT_DATA);
186938035ed6SNavdeep Parhar 		if (m == NULL)
187038035ed6SNavdeep Parhar 			return (NULL);
187138035ed6SNavdeep Parhar 		fl->mbuf_allocated++;
1872ccc69b2fSNavdeep Parhar 		if (clm != NULL) {
1873b741402cSNavdeep Parhar 			m_extaddref(m, payload, blen, &clm->refcount,
187438035ed6SNavdeep Parhar 			    rxb_free, swz->zone, sd->cl);
187582eff304SNavdeep Parhar 			if (sd->nmbuf++ == 0)
187682eff304SNavdeep Parhar 				counter_u64_add(extfree_refs, 1);
1877ccc69b2fSNavdeep Parhar 		} else {
187838035ed6SNavdeep Parhar 			m_cljset(m, sd->cl, swz->type);
187938035ed6SNavdeep Parhar 			sd->cl = NULL;	/* consumed, not a recycle candidate */
188038035ed6SNavdeep Parhar 		}
188138035ed6SNavdeep Parhar 	}
1882b741402cSNavdeep Parhar 	if (fr_offset == 0)
1883b741402cSNavdeep Parhar 		m->m_pkthdr.len = remaining;
188438035ed6SNavdeep Parhar 	m->m_len = len;
188538035ed6SNavdeep Parhar 
188638035ed6SNavdeep Parhar 	if (fl->flags & FL_BUF_PACKING) {
1887b741402cSNavdeep Parhar 		fl->rx_offset += blen;
188838035ed6SNavdeep Parhar 		MPASS(fl->rx_offset <= hwb->size);
188938035ed6SNavdeep Parhar 		if (fl->rx_offset < hwb->size)
189038035ed6SNavdeep Parhar 			return (m);	/* without advancing the cidx */
189138035ed6SNavdeep Parhar 	}
189238035ed6SNavdeep Parhar 
18934d6db4e0SNavdeep Parhar 	if (__predict_false(++fl->cidx % 8 == 0)) {
18944d6db4e0SNavdeep Parhar 		uint16_t cidx = fl->cidx / 8;
18954d6db4e0SNavdeep Parhar 
18964d6db4e0SNavdeep Parhar 		if (__predict_false(cidx == fl->sidx))
18974d6db4e0SNavdeep Parhar 			fl->cidx = cidx = 0;
18984d6db4e0SNavdeep Parhar 		fl->hw_cidx = cidx;
18994d6db4e0SNavdeep Parhar 	}
190038035ed6SNavdeep Parhar 	fl->rx_offset = 0;
190138035ed6SNavdeep Parhar 
190238035ed6SNavdeep Parhar 	return (m);
190338035ed6SNavdeep Parhar }
190438035ed6SNavdeep Parhar 
190538035ed6SNavdeep Parhar static struct mbuf *
19064d6db4e0SNavdeep Parhar get_fl_payload(struct adapter *sc, struct sge_fl *fl, uint32_t len_newbuf)
19071458bff9SNavdeep Parhar {
190838035ed6SNavdeep Parhar 	struct mbuf *m0, *m, **pnext;
1909b741402cSNavdeep Parhar 	u_int remaining;
1910b741402cSNavdeep Parhar 	const u_int total = G_RSPD_LEN(len_newbuf);
19111458bff9SNavdeep Parhar 
19124d6db4e0SNavdeep Parhar 	if (__predict_false(fl->flags & FL_BUF_RESUME)) {
1913368541baSNavdeep Parhar 		M_ASSERTPKTHDR(fl->m0);
1914b741402cSNavdeep Parhar 		MPASS(fl->m0->m_pkthdr.len == total);
1915b741402cSNavdeep Parhar 		MPASS(fl->remaining < total);
19161458bff9SNavdeep Parhar 
191738035ed6SNavdeep Parhar 		m0 = fl->m0;
191838035ed6SNavdeep Parhar 		pnext = fl->pnext;
1919b741402cSNavdeep Parhar 		remaining = fl->remaining;
19204d6db4e0SNavdeep Parhar 		fl->flags &= ~FL_BUF_RESUME;
192138035ed6SNavdeep Parhar 		goto get_segment;
19221458bff9SNavdeep Parhar 	}
19231458bff9SNavdeep Parhar 
192438035ed6SNavdeep Parhar 	if (fl->rx_offset > 0 && len_newbuf & F_RSPD_NEWBUF) {
19251458bff9SNavdeep Parhar 		fl->rx_offset = 0;
19264d6db4e0SNavdeep Parhar 		if (__predict_false(++fl->cidx % 8 == 0)) {
19274d6db4e0SNavdeep Parhar 			uint16_t cidx = fl->cidx / 8;
19284d6db4e0SNavdeep Parhar 
19294d6db4e0SNavdeep Parhar 			if (__predict_false(cidx == fl->sidx))
19304d6db4e0SNavdeep Parhar 				fl->cidx = cidx = 0;
19314d6db4e0SNavdeep Parhar 			fl->hw_cidx = cidx;
19324d6db4e0SNavdeep Parhar 		}
19331458bff9SNavdeep Parhar 	}
19341458bff9SNavdeep Parhar 
19351458bff9SNavdeep Parhar 	/*
193638035ed6SNavdeep Parhar 	 * Payload starts at rx_offset in the current hw buffer.  Its length is
193738035ed6SNavdeep Parhar 	 * 'len' and it may span multiple hw buffers.
19381458bff9SNavdeep Parhar 	 */
19391458bff9SNavdeep Parhar 
1940b741402cSNavdeep Parhar 	m0 = get_scatter_segment(sc, fl, 0, total);
1941368541baSNavdeep Parhar 	if (m0 == NULL)
19424d6db4e0SNavdeep Parhar 		return (NULL);
1943b741402cSNavdeep Parhar 	remaining = total - m0->m_len;
194438035ed6SNavdeep Parhar 	pnext = &m0->m_next;
1945b741402cSNavdeep Parhar 	while (remaining > 0) {
194638035ed6SNavdeep Parhar get_segment:
194738035ed6SNavdeep Parhar 		MPASS(fl->rx_offset == 0);
1948b741402cSNavdeep Parhar 		m = get_scatter_segment(sc, fl, total - remaining, remaining);
19494d6db4e0SNavdeep Parhar 		if (__predict_false(m == NULL)) {
195038035ed6SNavdeep Parhar 			fl->m0 = m0;
195138035ed6SNavdeep Parhar 			fl->pnext = pnext;
1952b741402cSNavdeep Parhar 			fl->remaining = remaining;
19534d6db4e0SNavdeep Parhar 			fl->flags |= FL_BUF_RESUME;
19544d6db4e0SNavdeep Parhar 			return (NULL);
19551458bff9SNavdeep Parhar 		}
195638035ed6SNavdeep Parhar 		*pnext = m;
195738035ed6SNavdeep Parhar 		pnext = &m->m_next;
1958b741402cSNavdeep Parhar 		remaining -= m->m_len;
1959733b9277SNavdeep Parhar 	}
196038035ed6SNavdeep Parhar 	*pnext = NULL;
19614d6db4e0SNavdeep Parhar 
1962dbbf46c4SNavdeep Parhar 	M_ASSERTPKTHDR(m0);
1963733b9277SNavdeep Parhar 	return (m0);
1964733b9277SNavdeep Parhar }
1965733b9277SNavdeep Parhar 
1966733b9277SNavdeep Parhar static int
1967733b9277SNavdeep Parhar t4_eth_rx(struct sge_iq *iq, const struct rss_header *rss, struct mbuf *m0)
1968733b9277SNavdeep Parhar {
19693c51d154SNavdeep Parhar 	struct sge_rxq *rxq = iq_to_rxq(iq);
1970733b9277SNavdeep Parhar 	struct ifnet *ifp = rxq->ifp;
197190e7434aSNavdeep Parhar 	struct adapter *sc = iq->adapter;
1972733b9277SNavdeep Parhar 	const struct cpl_rx_pkt *cpl = (const void *)(rss + 1);
1973a1ea9a82SNavdeep Parhar #if defined(INET) || defined(INET6)
1974733b9277SNavdeep Parhar 	struct lro_ctrl *lro = &rxq->lro;
1975733b9277SNavdeep Parhar #endif
197670ca6229SNavdeep Parhar 	static const int sw_hashtype[4][2] = {
197770ca6229SNavdeep Parhar 		{M_HASHTYPE_NONE, M_HASHTYPE_NONE},
197870ca6229SNavdeep Parhar 		{M_HASHTYPE_RSS_IPV4, M_HASHTYPE_RSS_IPV6},
197970ca6229SNavdeep Parhar 		{M_HASHTYPE_RSS_TCP_IPV4, M_HASHTYPE_RSS_TCP_IPV6},
198070ca6229SNavdeep Parhar 		{M_HASHTYPE_RSS_UDP_IPV4, M_HASHTYPE_RSS_UDP_IPV6},
198170ca6229SNavdeep Parhar 	};
1982733b9277SNavdeep Parhar 
1983733b9277SNavdeep Parhar 	KASSERT(m0 != NULL, ("%s: no payload with opcode %02x", __func__,
1984733b9277SNavdeep Parhar 	    rss->opcode));
1985733b9277SNavdeep Parhar 
198690e7434aSNavdeep Parhar 	m0->m_pkthdr.len -= sc->params.sge.fl_pktshift;
198790e7434aSNavdeep Parhar 	m0->m_len -= sc->params.sge.fl_pktshift;
198890e7434aSNavdeep Parhar 	m0->m_data += sc->params.sge.fl_pktshift;
198954e4ee71SNavdeep Parhar 
199054e4ee71SNavdeep Parhar 	m0->m_pkthdr.rcvif = ifp;
199170ca6229SNavdeep Parhar 	M_HASHTYPE_SET(m0, sw_hashtype[rss->hash_type][rss->ipv6]);
1992273ef991SNavdeep Parhar 	m0->m_pkthdr.flowid = be32toh(rss->hash_val);
199354e4ee71SNavdeep Parhar 
19941de8c69dSNavdeep Parhar 	if (cpl->csum_calc && !(cpl->err_vec & sc->params.tp.err_vec_mask)) {
19959600bf00SNavdeep Parhar 		if (ifp->if_capenable & IFCAP_RXCSUM &&
19969600bf00SNavdeep Parhar 		    cpl->l2info & htobe32(F_RXF_IP)) {
1997932b1a5fSNavdeep Parhar 			m0->m_pkthdr.csum_flags = (CSUM_IP_CHECKED |
199854e4ee71SNavdeep Parhar 			    CSUM_IP_VALID | CSUM_DATA_VALID | CSUM_PSEUDO_HDR);
19999600bf00SNavdeep Parhar 			rxq->rxcsum++;
20009600bf00SNavdeep Parhar 		} else if (ifp->if_capenable & IFCAP_RXCSUM_IPV6 &&
20019600bf00SNavdeep Parhar 		    cpl->l2info & htobe32(F_RXF_IP6)) {
2002932b1a5fSNavdeep Parhar 			m0->m_pkthdr.csum_flags = (CSUM_DATA_VALID_IPV6 |
20039600bf00SNavdeep Parhar 			    CSUM_PSEUDO_HDR);
20049600bf00SNavdeep Parhar 			rxq->rxcsum++;
20059600bf00SNavdeep Parhar 		}
20069600bf00SNavdeep Parhar 
20079600bf00SNavdeep Parhar 		if (__predict_false(cpl->ip_frag))
200854e4ee71SNavdeep Parhar 			m0->m_pkthdr.csum_data = be16toh(cpl->csum);
200954e4ee71SNavdeep Parhar 		else
201054e4ee71SNavdeep Parhar 			m0->m_pkthdr.csum_data = 0xffff;
201154e4ee71SNavdeep Parhar 	}
201254e4ee71SNavdeep Parhar 
201354e4ee71SNavdeep Parhar 	if (cpl->vlan_ex) {
201454e4ee71SNavdeep Parhar 		m0->m_pkthdr.ether_vtag = be16toh(cpl->vlan);
201554e4ee71SNavdeep Parhar 		m0->m_flags |= M_VLANTAG;
201654e4ee71SNavdeep Parhar 		rxq->vlan_extraction++;
201754e4ee71SNavdeep Parhar 	}
201854e4ee71SNavdeep Parhar 
2019a1ea9a82SNavdeep Parhar #if defined(INET) || defined(INET6)
202046f48ee5SNavdeep Parhar 	if (iq->flags & IQ_LRO_ENABLED) {
202146f48ee5SNavdeep Parhar 		if (sort_before_lro(lro)) {
202246f48ee5SNavdeep Parhar 			tcp_lro_queue_mbuf(lro, m0);
202346f48ee5SNavdeep Parhar 			return (0); /* queued for sort, then LRO */
202446f48ee5SNavdeep Parhar 		}
202546f48ee5SNavdeep Parhar 		if (tcp_lro_rx(lro, m0, 0) == 0)
202646f48ee5SNavdeep Parhar 			return (0); /* queued for LRO */
202746f48ee5SNavdeep Parhar 	}
202854e4ee71SNavdeep Parhar #endif
20297d29df59SNavdeep Parhar 	ifp->if_input(ifp, m0);
203054e4ee71SNavdeep Parhar 
2031733b9277SNavdeep Parhar 	return (0);
203254e4ee71SNavdeep Parhar }
203354e4ee71SNavdeep Parhar 
2034733b9277SNavdeep Parhar /*
20357951040fSNavdeep Parhar  * Must drain the wrq or make sure that someone else will.
20367951040fSNavdeep Parhar  */
20377951040fSNavdeep Parhar static void
20387951040fSNavdeep Parhar wrq_tx_drain(void *arg, int n)
20397951040fSNavdeep Parhar {
20407951040fSNavdeep Parhar 	struct sge_wrq *wrq = arg;
20417951040fSNavdeep Parhar 	struct sge_eq *eq = &wrq->eq;
20427951040fSNavdeep Parhar 
20437951040fSNavdeep Parhar 	EQ_LOCK(eq);
20447951040fSNavdeep Parhar 	if (TAILQ_EMPTY(&wrq->incomplete_wrs) && !STAILQ_EMPTY(&wrq->wr_list))
20457951040fSNavdeep Parhar 		drain_wrq_wr_list(wrq->adapter, wrq);
20467951040fSNavdeep Parhar 	EQ_UNLOCK(eq);
20477951040fSNavdeep Parhar }
20487951040fSNavdeep Parhar 
20497951040fSNavdeep Parhar static void
20507951040fSNavdeep Parhar drain_wrq_wr_list(struct adapter *sc, struct sge_wrq *wrq)
20517951040fSNavdeep Parhar {
20527951040fSNavdeep Parhar 	struct sge_eq *eq = &wrq->eq;
20537951040fSNavdeep Parhar 	u_int available, dbdiff;	/* # of hardware descriptors */
20547951040fSNavdeep Parhar 	u_int n;
20557951040fSNavdeep Parhar 	struct wrqe *wr;
20567951040fSNavdeep Parhar 	struct fw_eth_tx_pkt_wr *dst;	/* any fw WR struct will do */
20577951040fSNavdeep Parhar 
20587951040fSNavdeep Parhar 	EQ_LOCK_ASSERT_OWNED(eq);
20597951040fSNavdeep Parhar 	MPASS(TAILQ_EMPTY(&wrq->incomplete_wrs));
20607951040fSNavdeep Parhar 	wr = STAILQ_FIRST(&wrq->wr_list);
20617951040fSNavdeep Parhar 	MPASS(wr != NULL);	/* Must be called with something useful to do */
2062cda2ab0eSNavdeep Parhar 	MPASS(eq->pidx == eq->dbidx);
2063cda2ab0eSNavdeep Parhar 	dbdiff = 0;
20647951040fSNavdeep Parhar 
20657951040fSNavdeep Parhar 	do {
20667951040fSNavdeep Parhar 		eq->cidx = read_hw_cidx(eq);
20677951040fSNavdeep Parhar 		if (eq->pidx == eq->cidx)
20687951040fSNavdeep Parhar 			available = eq->sidx - 1;
20697951040fSNavdeep Parhar 		else
20707951040fSNavdeep Parhar 			available = IDXDIFF(eq->cidx, eq->pidx, eq->sidx) - 1;
20717951040fSNavdeep Parhar 
20727951040fSNavdeep Parhar 		MPASS(wr->wrq == wrq);
20737951040fSNavdeep Parhar 		n = howmany(wr->wr_len, EQ_ESIZE);
20747951040fSNavdeep Parhar 		if (available < n)
2075cda2ab0eSNavdeep Parhar 			break;
20767951040fSNavdeep Parhar 
20777951040fSNavdeep Parhar 		dst = (void *)&eq->desc[eq->pidx];
20787951040fSNavdeep Parhar 		if (__predict_true(eq->sidx - eq->pidx > n)) {
20797951040fSNavdeep Parhar 			/* Won't wrap, won't end exactly at the status page. */
20807951040fSNavdeep Parhar 			bcopy(&wr->wr[0], dst, wr->wr_len);
20817951040fSNavdeep Parhar 			eq->pidx += n;
20827951040fSNavdeep Parhar 		} else {
20837951040fSNavdeep Parhar 			int first_portion = (eq->sidx - eq->pidx) * EQ_ESIZE;
20847951040fSNavdeep Parhar 
20857951040fSNavdeep Parhar 			bcopy(&wr->wr[0], dst, first_portion);
20867951040fSNavdeep Parhar 			if (wr->wr_len > first_portion) {
20877951040fSNavdeep Parhar 				bcopy(&wr->wr[first_portion], &eq->desc[0],
20887951040fSNavdeep Parhar 				    wr->wr_len - first_portion);
20897951040fSNavdeep Parhar 			}
20907951040fSNavdeep Parhar 			eq->pidx = n - (eq->sidx - eq->pidx);
20917951040fSNavdeep Parhar 		}
20920459a175SNavdeep Parhar 		wrq->tx_wrs_copied++;
20937951040fSNavdeep Parhar 
20947951040fSNavdeep Parhar 		if (available < eq->sidx / 4 &&
20957951040fSNavdeep Parhar 		    atomic_cmpset_int(&eq->equiq, 0, 1)) {
2096ddf09ad6SNavdeep Parhar 				/*
2097ddf09ad6SNavdeep Parhar 				 * XXX: This is not 100% reliable with some
2098ddf09ad6SNavdeep Parhar 				 * types of WRs.  But this is a very unusual
2099ddf09ad6SNavdeep Parhar 				 * situation for an ofld/ctrl queue anyway.
2100ddf09ad6SNavdeep Parhar 				 */
21017951040fSNavdeep Parhar 			dst->equiq_to_len16 |= htobe32(F_FW_WR_EQUIQ |
21027951040fSNavdeep Parhar 			    F_FW_WR_EQUEQ);
21037951040fSNavdeep Parhar 		}
21047951040fSNavdeep Parhar 
21057951040fSNavdeep Parhar 		dbdiff += n;
21067951040fSNavdeep Parhar 		if (dbdiff >= 16) {
21077951040fSNavdeep Parhar 			ring_eq_db(sc, eq, dbdiff);
21087951040fSNavdeep Parhar 			dbdiff = 0;
21097951040fSNavdeep Parhar 		}
21107951040fSNavdeep Parhar 
21117951040fSNavdeep Parhar 		STAILQ_REMOVE_HEAD(&wrq->wr_list, link);
21127951040fSNavdeep Parhar 		free_wrqe(wr);
21137951040fSNavdeep Parhar 		MPASS(wrq->nwr_pending > 0);
21147951040fSNavdeep Parhar 		wrq->nwr_pending--;
21157951040fSNavdeep Parhar 		MPASS(wrq->ndesc_needed >= n);
21167951040fSNavdeep Parhar 		wrq->ndesc_needed -= n;
21177951040fSNavdeep Parhar 	} while ((wr = STAILQ_FIRST(&wrq->wr_list)) != NULL);
21187951040fSNavdeep Parhar 
21197951040fSNavdeep Parhar 	if (dbdiff)
21207951040fSNavdeep Parhar 		ring_eq_db(sc, eq, dbdiff);
21217951040fSNavdeep Parhar }
21227951040fSNavdeep Parhar 
21237951040fSNavdeep Parhar /*
2124733b9277SNavdeep Parhar  * Doesn't fail.  Holds on to work requests it can't send right away.
2125733b9277SNavdeep Parhar  */
212609fe6320SNavdeep Parhar void
212709fe6320SNavdeep Parhar t4_wrq_tx_locked(struct adapter *sc, struct sge_wrq *wrq, struct wrqe *wr)
2128733b9277SNavdeep Parhar {
2129733b9277SNavdeep Parhar #ifdef INVARIANTS
21307951040fSNavdeep Parhar 	struct sge_eq *eq = &wrq->eq;
2131733b9277SNavdeep Parhar #endif
2132733b9277SNavdeep Parhar 
21337951040fSNavdeep Parhar 	EQ_LOCK_ASSERT_OWNED(eq);
21347951040fSNavdeep Parhar 	MPASS(wr != NULL);
21357951040fSNavdeep Parhar 	MPASS(wr->wr_len > 0 && wr->wr_len <= SGE_MAX_WR_LEN);
21367951040fSNavdeep Parhar 	MPASS((wr->wr_len & 0x7) == 0);
2137733b9277SNavdeep Parhar 
21387951040fSNavdeep Parhar 	STAILQ_INSERT_TAIL(&wrq->wr_list, wr, link);
21397951040fSNavdeep Parhar 	wrq->nwr_pending++;
21407951040fSNavdeep Parhar 	wrq->ndesc_needed += howmany(wr->wr_len, EQ_ESIZE);
2141733b9277SNavdeep Parhar 
21427951040fSNavdeep Parhar 	if (!TAILQ_EMPTY(&wrq->incomplete_wrs))
21437951040fSNavdeep Parhar 		return;	/* commit_wrq_wr will drain wr_list as well. */
2144733b9277SNavdeep Parhar 
21457951040fSNavdeep Parhar 	drain_wrq_wr_list(sc, wrq);
2146733b9277SNavdeep Parhar 
21477951040fSNavdeep Parhar 	/* Doorbell must have caught up to the pidx. */
21487951040fSNavdeep Parhar 	MPASS(eq->pidx == eq->dbidx);
214954e4ee71SNavdeep Parhar }
215054e4ee71SNavdeep Parhar 
215154e4ee71SNavdeep Parhar void
215254e4ee71SNavdeep Parhar t4_update_fl_bufsize(struct ifnet *ifp)
215354e4ee71SNavdeep Parhar {
2154fe2ebb76SJohn Baldwin 	struct vi_info *vi = ifp->if_softc;
2155fe2ebb76SJohn Baldwin 	struct adapter *sc = vi->pi->adapter;
215654e4ee71SNavdeep Parhar 	struct sge_rxq *rxq;
21576eb3180fSNavdeep Parhar #ifdef TCP_OFFLOAD
21586eb3180fSNavdeep Parhar 	struct sge_ofld_rxq *ofld_rxq;
21596eb3180fSNavdeep Parhar #endif
216054e4ee71SNavdeep Parhar 	struct sge_fl *fl;
216138035ed6SNavdeep Parhar 	int i, maxp, mtu = ifp->if_mtu;
216254e4ee71SNavdeep Parhar 
216338035ed6SNavdeep Parhar 	maxp = mtu_to_max_payload(sc, mtu, 0);
2164fe2ebb76SJohn Baldwin 	for_each_rxq(vi, i, rxq) {
216554e4ee71SNavdeep Parhar 		fl = &rxq->fl;
216654e4ee71SNavdeep Parhar 
216754e4ee71SNavdeep Parhar 		FL_LOCK(fl);
216838035ed6SNavdeep Parhar 		find_best_refill_source(sc, fl, maxp);
216954e4ee71SNavdeep Parhar 		FL_UNLOCK(fl);
217054e4ee71SNavdeep Parhar 	}
21716eb3180fSNavdeep Parhar #ifdef TCP_OFFLOAD
217238035ed6SNavdeep Parhar 	maxp = mtu_to_max_payload(sc, mtu, 1);
2173fe2ebb76SJohn Baldwin 	for_each_ofld_rxq(vi, i, ofld_rxq) {
21746eb3180fSNavdeep Parhar 		fl = &ofld_rxq->fl;
21756eb3180fSNavdeep Parhar 
21766eb3180fSNavdeep Parhar 		FL_LOCK(fl);
217738035ed6SNavdeep Parhar 		find_best_refill_source(sc, fl, maxp);
21786eb3180fSNavdeep Parhar 		FL_UNLOCK(fl);
21796eb3180fSNavdeep Parhar 	}
21806eb3180fSNavdeep Parhar #endif
218154e4ee71SNavdeep Parhar }
218254e4ee71SNavdeep Parhar 
21837951040fSNavdeep Parhar static inline int
21847951040fSNavdeep Parhar mbuf_nsegs(struct mbuf *m)
2185733b9277SNavdeep Parhar {
21860835ddc7SNavdeep Parhar 
21877951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
21887951040fSNavdeep Parhar 	KASSERT(m->m_pkthdr.l5hlen > 0,
21897951040fSNavdeep Parhar 	    ("%s: mbuf %p missing information on # of segments.", __func__, m));
21907951040fSNavdeep Parhar 
21917951040fSNavdeep Parhar 	return (m->m_pkthdr.l5hlen);
21927951040fSNavdeep Parhar }
21937951040fSNavdeep Parhar 
21947951040fSNavdeep Parhar static inline void
21957951040fSNavdeep Parhar set_mbuf_nsegs(struct mbuf *m, uint8_t nsegs)
21967951040fSNavdeep Parhar {
21977951040fSNavdeep Parhar 
21987951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
21997951040fSNavdeep Parhar 	m->m_pkthdr.l5hlen = nsegs;
22007951040fSNavdeep Parhar }
22017951040fSNavdeep Parhar 
22027951040fSNavdeep Parhar static inline int
2203*5cdaef71SJohn Baldwin mbuf_cflags(struct mbuf *m)
2204*5cdaef71SJohn Baldwin {
2205*5cdaef71SJohn Baldwin 
2206*5cdaef71SJohn Baldwin 	M_ASSERTPKTHDR(m);
2207*5cdaef71SJohn Baldwin 	return (m->m_pkthdr.PH_loc.eight[4]);
2208*5cdaef71SJohn Baldwin }
2209*5cdaef71SJohn Baldwin 
2210*5cdaef71SJohn Baldwin static inline void
2211*5cdaef71SJohn Baldwin set_mbuf_cflags(struct mbuf *m, uint8_t flags)
2212*5cdaef71SJohn Baldwin {
2213*5cdaef71SJohn Baldwin 
2214*5cdaef71SJohn Baldwin 	M_ASSERTPKTHDR(m);
2215*5cdaef71SJohn Baldwin 	m->m_pkthdr.PH_loc.eight[4] = flags;
2216*5cdaef71SJohn Baldwin }
2217*5cdaef71SJohn Baldwin 
2218*5cdaef71SJohn Baldwin static inline int
22197951040fSNavdeep Parhar mbuf_len16(struct mbuf *m)
22207951040fSNavdeep Parhar {
22217951040fSNavdeep Parhar 	int n;
22227951040fSNavdeep Parhar 
22237951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
22247951040fSNavdeep Parhar 	n = m->m_pkthdr.PH_loc.eight[0];
22257951040fSNavdeep Parhar 	MPASS(n > 0 && n <= SGE_MAX_WR_LEN / 16);
22267951040fSNavdeep Parhar 
22277951040fSNavdeep Parhar 	return (n);
22287951040fSNavdeep Parhar }
22297951040fSNavdeep Parhar 
22307951040fSNavdeep Parhar static inline void
22317951040fSNavdeep Parhar set_mbuf_len16(struct mbuf *m, uint8_t len16)
22327951040fSNavdeep Parhar {
22337951040fSNavdeep Parhar 
22347951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
22357951040fSNavdeep Parhar 	m->m_pkthdr.PH_loc.eight[0] = len16;
22367951040fSNavdeep Parhar }
22377951040fSNavdeep Parhar 
2238786099deSNavdeep Parhar #ifdef RATELIMIT
2239786099deSNavdeep Parhar static inline int
2240786099deSNavdeep Parhar mbuf_eo_nsegs(struct mbuf *m)
2241786099deSNavdeep Parhar {
2242786099deSNavdeep Parhar 
2243786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2244786099deSNavdeep Parhar 	return (m->m_pkthdr.PH_loc.eight[1]);
2245786099deSNavdeep Parhar }
2246786099deSNavdeep Parhar 
2247786099deSNavdeep Parhar static inline void
2248786099deSNavdeep Parhar set_mbuf_eo_nsegs(struct mbuf *m, uint8_t nsegs)
2249786099deSNavdeep Parhar {
2250786099deSNavdeep Parhar 
2251786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2252786099deSNavdeep Parhar 	m->m_pkthdr.PH_loc.eight[1] = nsegs;
2253786099deSNavdeep Parhar }
2254786099deSNavdeep Parhar 
2255786099deSNavdeep Parhar static inline int
2256786099deSNavdeep Parhar mbuf_eo_len16(struct mbuf *m)
2257786099deSNavdeep Parhar {
2258786099deSNavdeep Parhar 	int n;
2259786099deSNavdeep Parhar 
2260786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2261786099deSNavdeep Parhar 	n = m->m_pkthdr.PH_loc.eight[2];
2262786099deSNavdeep Parhar 	MPASS(n > 0 && n <= SGE_MAX_WR_LEN / 16);
2263786099deSNavdeep Parhar 
2264786099deSNavdeep Parhar 	return (n);
2265786099deSNavdeep Parhar }
2266786099deSNavdeep Parhar 
2267786099deSNavdeep Parhar static inline void
2268786099deSNavdeep Parhar set_mbuf_eo_len16(struct mbuf *m, uint8_t len16)
2269786099deSNavdeep Parhar {
2270786099deSNavdeep Parhar 
2271786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2272786099deSNavdeep Parhar 	m->m_pkthdr.PH_loc.eight[2] = len16;
2273786099deSNavdeep Parhar }
2274786099deSNavdeep Parhar 
2275786099deSNavdeep Parhar static inline int
2276786099deSNavdeep Parhar mbuf_eo_tsclk_tsoff(struct mbuf *m)
2277786099deSNavdeep Parhar {
2278786099deSNavdeep Parhar 
2279786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2280786099deSNavdeep Parhar 	return (m->m_pkthdr.PH_loc.eight[3]);
2281786099deSNavdeep Parhar }
2282786099deSNavdeep Parhar 
2283786099deSNavdeep Parhar static inline void
2284786099deSNavdeep Parhar set_mbuf_eo_tsclk_tsoff(struct mbuf *m, uint8_t tsclk_tsoff)
2285786099deSNavdeep Parhar {
2286786099deSNavdeep Parhar 
2287786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2288786099deSNavdeep Parhar 	m->m_pkthdr.PH_loc.eight[3] = tsclk_tsoff;
2289786099deSNavdeep Parhar }
2290786099deSNavdeep Parhar 
2291786099deSNavdeep Parhar static inline int
2292786099deSNavdeep Parhar needs_eo(struct mbuf *m)
2293786099deSNavdeep Parhar {
2294786099deSNavdeep Parhar 
2295786099deSNavdeep Parhar 	return (m->m_pkthdr.snd_tag != NULL);
2296786099deSNavdeep Parhar }
2297786099deSNavdeep Parhar #endif
2298786099deSNavdeep Parhar 
2299*5cdaef71SJohn Baldwin /*
2300*5cdaef71SJohn Baldwin  * Try to allocate an mbuf to contain a raw work request.  To make it
2301*5cdaef71SJohn Baldwin  * easy to construct the work request, don't allocate a chain but a
2302*5cdaef71SJohn Baldwin  * single mbuf.
2303*5cdaef71SJohn Baldwin  */
2304*5cdaef71SJohn Baldwin struct mbuf *
2305*5cdaef71SJohn Baldwin alloc_wr_mbuf(int len, int how)
2306*5cdaef71SJohn Baldwin {
2307*5cdaef71SJohn Baldwin 	struct mbuf *m;
2308*5cdaef71SJohn Baldwin 
2309*5cdaef71SJohn Baldwin 	if (len <= MHLEN)
2310*5cdaef71SJohn Baldwin 		m = m_gethdr(how, MT_DATA);
2311*5cdaef71SJohn Baldwin 	else if (len <= MCLBYTES)
2312*5cdaef71SJohn Baldwin 		m = m_getcl(how, MT_DATA, M_PKTHDR);
2313*5cdaef71SJohn Baldwin 	else
2314*5cdaef71SJohn Baldwin 		m = NULL;
2315*5cdaef71SJohn Baldwin 	if (m == NULL)
2316*5cdaef71SJohn Baldwin 		return (NULL);
2317*5cdaef71SJohn Baldwin 	m->m_pkthdr.len = len;
2318*5cdaef71SJohn Baldwin 	m->m_len = len;
2319*5cdaef71SJohn Baldwin 	set_mbuf_cflags(m, MC_RAW_WR);
2320*5cdaef71SJohn Baldwin 	set_mbuf_len16(m, howmany(len, 16));
2321*5cdaef71SJohn Baldwin 	return (m);
2322*5cdaef71SJohn Baldwin }
2323*5cdaef71SJohn Baldwin 
23247951040fSNavdeep Parhar static inline int
23257951040fSNavdeep Parhar needs_tso(struct mbuf *m)
23267951040fSNavdeep Parhar {
23277951040fSNavdeep Parhar 
23287951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
23297951040fSNavdeep Parhar 
2330a6a8ff35SNavdeep Parhar 	return (m->m_pkthdr.csum_flags & CSUM_TSO);
23317951040fSNavdeep Parhar }
23327951040fSNavdeep Parhar 
23337951040fSNavdeep Parhar static inline int
23347951040fSNavdeep Parhar needs_l3_csum(struct mbuf *m)
23357951040fSNavdeep Parhar {
23367951040fSNavdeep Parhar 
23377951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
23387951040fSNavdeep Parhar 
2339a6a8ff35SNavdeep Parhar 	return (m->m_pkthdr.csum_flags & (CSUM_IP | CSUM_TSO));
23407951040fSNavdeep Parhar }
23417951040fSNavdeep Parhar 
23427951040fSNavdeep Parhar static inline int
23437951040fSNavdeep Parhar needs_l4_csum(struct mbuf *m)
23447951040fSNavdeep Parhar {
23457951040fSNavdeep Parhar 
23467951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
23477951040fSNavdeep Parhar 
2348a6a8ff35SNavdeep Parhar 	return (m->m_pkthdr.csum_flags & (CSUM_TCP | CSUM_UDP | CSUM_UDP_IPV6 |
2349a6a8ff35SNavdeep Parhar 	    CSUM_TCP_IPV6 | CSUM_TSO));
23507951040fSNavdeep Parhar }
23517951040fSNavdeep Parhar 
23527951040fSNavdeep Parhar static inline int
2353786099deSNavdeep Parhar needs_tcp_csum(struct mbuf *m)
2354786099deSNavdeep Parhar {
2355786099deSNavdeep Parhar 
2356786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2357786099deSNavdeep Parhar 	return (m->m_pkthdr.csum_flags & (CSUM_TCP | CSUM_TCP_IPV6 | CSUM_TSO));
2358786099deSNavdeep Parhar }
2359786099deSNavdeep Parhar 
2360c3fce948SNavdeep Parhar #ifdef RATELIMIT
2361786099deSNavdeep Parhar static inline int
2362786099deSNavdeep Parhar needs_udp_csum(struct mbuf *m)
2363786099deSNavdeep Parhar {
2364786099deSNavdeep Parhar 
2365786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2366786099deSNavdeep Parhar 	return (m->m_pkthdr.csum_flags & (CSUM_UDP | CSUM_UDP_IPV6));
2367786099deSNavdeep Parhar }
2368c3fce948SNavdeep Parhar #endif
2369786099deSNavdeep Parhar 
2370786099deSNavdeep Parhar static inline int
23717951040fSNavdeep Parhar needs_vlan_insertion(struct mbuf *m)
23727951040fSNavdeep Parhar {
23737951040fSNavdeep Parhar 
23747951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
23757951040fSNavdeep Parhar 
2376a6a8ff35SNavdeep Parhar 	return (m->m_flags & M_VLANTAG);
23777951040fSNavdeep Parhar }
23787951040fSNavdeep Parhar 
23797951040fSNavdeep Parhar static void *
23807951040fSNavdeep Parhar m_advance(struct mbuf **pm, int *poffset, int len)
23817951040fSNavdeep Parhar {
23827951040fSNavdeep Parhar 	struct mbuf *m = *pm;
23837951040fSNavdeep Parhar 	int offset = *poffset;
23847951040fSNavdeep Parhar 	uintptr_t p = 0;
23857951040fSNavdeep Parhar 
23867951040fSNavdeep Parhar 	MPASS(len > 0);
23877951040fSNavdeep Parhar 
2388e06ab612SJohn Baldwin 	for (;;) {
23897951040fSNavdeep Parhar 		if (offset + len < m->m_len) {
23907951040fSNavdeep Parhar 			offset += len;
23917951040fSNavdeep Parhar 			p = mtod(m, uintptr_t) + offset;
23927951040fSNavdeep Parhar 			break;
23937951040fSNavdeep Parhar 		}
23947951040fSNavdeep Parhar 		len -= m->m_len - offset;
23957951040fSNavdeep Parhar 		m = m->m_next;
23967951040fSNavdeep Parhar 		offset = 0;
23977951040fSNavdeep Parhar 		MPASS(m != NULL);
23987951040fSNavdeep Parhar 	}
23997951040fSNavdeep Parhar 	*poffset = offset;
24007951040fSNavdeep Parhar 	*pm = m;
24017951040fSNavdeep Parhar 	return ((void *)p);
24027951040fSNavdeep Parhar }
24037951040fSNavdeep Parhar 
24047951040fSNavdeep Parhar /*
24057951040fSNavdeep Parhar  * Can deal with empty mbufs in the chain that have m_len = 0, but the chain
2406786099deSNavdeep Parhar  * must have at least one mbuf that's not empty.  It is possible for this
2407786099deSNavdeep Parhar  * routine to return 0 if skip accounts for all the contents of the mbuf chain.
24087951040fSNavdeep Parhar  */
24097951040fSNavdeep Parhar static inline int
2410786099deSNavdeep Parhar count_mbuf_nsegs(struct mbuf *m, int skip)
24117951040fSNavdeep Parhar {
241277e9044cSNavdeep Parhar 	vm_paddr_t lastb, next;
241377e9044cSNavdeep Parhar 	vm_offset_t va;
24147951040fSNavdeep Parhar 	int len, nsegs;
24157951040fSNavdeep Parhar 
2416786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m);
2417786099deSNavdeep Parhar 	MPASS(m->m_pkthdr.len > 0);
2418786099deSNavdeep Parhar 	MPASS(m->m_pkthdr.len >= skip);
24197951040fSNavdeep Parhar 
24207951040fSNavdeep Parhar 	nsegs = 0;
242177e9044cSNavdeep Parhar 	lastb = 0;
24227951040fSNavdeep Parhar 	for (; m; m = m->m_next) {
24237951040fSNavdeep Parhar 
24247951040fSNavdeep Parhar 		len = m->m_len;
24257951040fSNavdeep Parhar 		if (__predict_false(len == 0))
24267951040fSNavdeep Parhar 			continue;
2427786099deSNavdeep Parhar 		if (skip >= len) {
2428786099deSNavdeep Parhar 			skip -= len;
2429786099deSNavdeep Parhar 			continue;
2430786099deSNavdeep Parhar 		}
2431786099deSNavdeep Parhar 		va = mtod(m, vm_offset_t) + skip;
2432786099deSNavdeep Parhar 		len -= skip;
2433786099deSNavdeep Parhar 		skip = 0;
243477e9044cSNavdeep Parhar 		next = pmap_kextract(va);
2435786099deSNavdeep Parhar 		nsegs += sglist_count((void *)(uintptr_t)va, len);
243677e9044cSNavdeep Parhar 		if (lastb + 1 == next)
24377951040fSNavdeep Parhar 			nsegs--;
243877e9044cSNavdeep Parhar 		lastb = pmap_kextract(va + len - 1);
24397951040fSNavdeep Parhar 	}
24407951040fSNavdeep Parhar 
24417951040fSNavdeep Parhar 	return (nsegs);
24427951040fSNavdeep Parhar }
24437951040fSNavdeep Parhar 
24447951040fSNavdeep Parhar /*
24457951040fSNavdeep Parhar  * Analyze the mbuf to determine its tx needs.  The mbuf passed in may change:
24467951040fSNavdeep Parhar  * a) caller can assume it's been freed if this function returns with an error.
24477951040fSNavdeep Parhar  * b) it may get defragged up if the gather list is too long for the hardware.
24487951040fSNavdeep Parhar  */
24497951040fSNavdeep Parhar int
24506af45170SJohn Baldwin parse_pkt(struct adapter *sc, struct mbuf **mp)
24517951040fSNavdeep Parhar {
24527951040fSNavdeep Parhar 	struct mbuf *m0 = *mp, *m;
24537951040fSNavdeep Parhar 	int rc, nsegs, defragged = 0, offset;
24547951040fSNavdeep Parhar 	struct ether_header *eh;
24557951040fSNavdeep Parhar 	void *l3hdr;
24567951040fSNavdeep Parhar #if defined(INET) || defined(INET6)
24577951040fSNavdeep Parhar 	struct tcphdr *tcp;
24587951040fSNavdeep Parhar #endif
24597951040fSNavdeep Parhar 	uint16_t eh_type;
24607951040fSNavdeep Parhar 
24617951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m0);
24627951040fSNavdeep Parhar 	if (__predict_false(m0->m_pkthdr.len < ETHER_HDR_LEN)) {
24637951040fSNavdeep Parhar 		rc = EINVAL;
24647951040fSNavdeep Parhar fail:
24657951040fSNavdeep Parhar 		m_freem(m0);
24667951040fSNavdeep Parhar 		*mp = NULL;
24677951040fSNavdeep Parhar 		return (rc);
24687951040fSNavdeep Parhar 	}
24697951040fSNavdeep Parhar restart:
24707951040fSNavdeep Parhar 	/*
24717951040fSNavdeep Parhar 	 * First count the number of gather list segments in the payload.
24727951040fSNavdeep Parhar 	 * Defrag the mbuf if nsegs exceeds the hardware limit.
24737951040fSNavdeep Parhar 	 */
24747951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m0);
24757951040fSNavdeep Parhar 	MPASS(m0->m_pkthdr.len > 0);
2476786099deSNavdeep Parhar 	nsegs = count_mbuf_nsegs(m0, 0);
24777951040fSNavdeep Parhar 	if (nsegs > (needs_tso(m0) ? TX_SGL_SEGS_TSO : TX_SGL_SEGS)) {
24787951040fSNavdeep Parhar 		if (defragged++ > 0 || (m = m_defrag(m0, M_NOWAIT)) == NULL) {
24797951040fSNavdeep Parhar 			rc = EFBIG;
24807951040fSNavdeep Parhar 			goto fail;
24817951040fSNavdeep Parhar 		}
24827951040fSNavdeep Parhar 		*mp = m0 = m;	/* update caller's copy after defrag */
24837951040fSNavdeep Parhar 		goto restart;
24847951040fSNavdeep Parhar 	}
24857951040fSNavdeep Parhar 
24867951040fSNavdeep Parhar 	if (__predict_false(nsegs > 2 && m0->m_pkthdr.len <= MHLEN)) {
24877951040fSNavdeep Parhar 		m0 = m_pullup(m0, m0->m_pkthdr.len);
24887951040fSNavdeep Parhar 		if (m0 == NULL) {
24897951040fSNavdeep Parhar 			/* Should have left well enough alone. */
24907951040fSNavdeep Parhar 			rc = EFBIG;
24917951040fSNavdeep Parhar 			goto fail;
24927951040fSNavdeep Parhar 		}
24937951040fSNavdeep Parhar 		*mp = m0;	/* update caller's copy after pullup */
24947951040fSNavdeep Parhar 		goto restart;
24957951040fSNavdeep Parhar 	}
24967951040fSNavdeep Parhar 	set_mbuf_nsegs(m0, nsegs);
2497*5cdaef71SJohn Baldwin 	set_mbuf_cflags(m0, 0);
24986af45170SJohn Baldwin 	if (sc->flags & IS_VF)
24996af45170SJohn Baldwin 		set_mbuf_len16(m0, txpkt_vm_len16(nsegs, needs_tso(m0)));
25006af45170SJohn Baldwin 	else
25017951040fSNavdeep Parhar 		set_mbuf_len16(m0, txpkt_len16(nsegs, needs_tso(m0)));
25027951040fSNavdeep Parhar 
2503786099deSNavdeep Parhar #ifdef RATELIMIT
2504786099deSNavdeep Parhar 	/*
2505786099deSNavdeep Parhar 	 * Ethofld is limited to TCP and UDP for now, and only when L4 hw
2506786099deSNavdeep Parhar 	 * checksumming is enabled.  needs_l4_csum happens to check for all the
2507786099deSNavdeep Parhar 	 * right things.
2508786099deSNavdeep Parhar 	 */
2509786099deSNavdeep Parhar 	if (__predict_false(needs_eo(m0) && !needs_l4_csum(m0)))
2510786099deSNavdeep Parhar 		m0->m_pkthdr.snd_tag = NULL;
2511786099deSNavdeep Parhar #endif
2512786099deSNavdeep Parhar 
25136af45170SJohn Baldwin 	if (!needs_tso(m0) &&
2514786099deSNavdeep Parhar #ifdef RATELIMIT
2515786099deSNavdeep Parhar 	    !needs_eo(m0) &&
2516786099deSNavdeep Parhar #endif
25176af45170SJohn Baldwin 	    !(sc->flags & IS_VF && (needs_l3_csum(m0) || needs_l4_csum(m0))))
25187951040fSNavdeep Parhar 		return (0);
25197951040fSNavdeep Parhar 
25207951040fSNavdeep Parhar 	m = m0;
25217951040fSNavdeep Parhar 	eh = mtod(m, struct ether_header *);
25227951040fSNavdeep Parhar 	eh_type = ntohs(eh->ether_type);
25237951040fSNavdeep Parhar 	if (eh_type == ETHERTYPE_VLAN) {
25247951040fSNavdeep Parhar 		struct ether_vlan_header *evh = (void *)eh;
25257951040fSNavdeep Parhar 
25267951040fSNavdeep Parhar 		eh_type = ntohs(evh->evl_proto);
25277951040fSNavdeep Parhar 		m0->m_pkthdr.l2hlen = sizeof(*evh);
25287951040fSNavdeep Parhar 	} else
25297951040fSNavdeep Parhar 		m0->m_pkthdr.l2hlen = sizeof(*eh);
25307951040fSNavdeep Parhar 
25317951040fSNavdeep Parhar 	offset = 0;
25327951040fSNavdeep Parhar 	l3hdr = m_advance(&m, &offset, m0->m_pkthdr.l2hlen);
25337951040fSNavdeep Parhar 
25347951040fSNavdeep Parhar 	switch (eh_type) {
25357951040fSNavdeep Parhar #ifdef INET6
25367951040fSNavdeep Parhar 	case ETHERTYPE_IPV6:
25377951040fSNavdeep Parhar 	{
25387951040fSNavdeep Parhar 		struct ip6_hdr *ip6 = l3hdr;
25397951040fSNavdeep Parhar 
25406af45170SJohn Baldwin 		MPASS(!needs_tso(m0) || ip6->ip6_nxt == IPPROTO_TCP);
25417951040fSNavdeep Parhar 
25427951040fSNavdeep Parhar 		m0->m_pkthdr.l3hlen = sizeof(*ip6);
25437951040fSNavdeep Parhar 		break;
25447951040fSNavdeep Parhar 	}
25457951040fSNavdeep Parhar #endif
25467951040fSNavdeep Parhar #ifdef INET
25477951040fSNavdeep Parhar 	case ETHERTYPE_IP:
25487951040fSNavdeep Parhar 	{
25497951040fSNavdeep Parhar 		struct ip *ip = l3hdr;
25507951040fSNavdeep Parhar 
25517951040fSNavdeep Parhar 		m0->m_pkthdr.l3hlen = ip->ip_hl * 4;
25527951040fSNavdeep Parhar 		break;
25537951040fSNavdeep Parhar 	}
25547951040fSNavdeep Parhar #endif
25557951040fSNavdeep Parhar 	default:
25567951040fSNavdeep Parhar 		panic("%s: ethertype 0x%04x unknown.  if_cxgbe must be compiled"
25577951040fSNavdeep Parhar 		    " with the same INET/INET6 options as the kernel.",
25587951040fSNavdeep Parhar 		    __func__, eh_type);
25597951040fSNavdeep Parhar 	}
25607951040fSNavdeep Parhar 
25617951040fSNavdeep Parhar #if defined(INET) || defined(INET6)
2562786099deSNavdeep Parhar 	if (needs_tcp_csum(m0)) {
25637951040fSNavdeep Parhar 		tcp = m_advance(&m, &offset, m0->m_pkthdr.l3hlen);
25647951040fSNavdeep Parhar 		m0->m_pkthdr.l4hlen = tcp->th_off * 4;
2565786099deSNavdeep Parhar #ifdef RATELIMIT
2566786099deSNavdeep Parhar 		if (tsclk >= 0 && *(uint32_t *)(tcp + 1) == ntohl(0x0101080a)) {
2567786099deSNavdeep Parhar 			set_mbuf_eo_tsclk_tsoff(m0,
2568786099deSNavdeep Parhar 			    V_FW_ETH_TX_EO_WR_TSCLK(tsclk) |
2569786099deSNavdeep Parhar 			    V_FW_ETH_TX_EO_WR_TSOFF(sizeof(*tcp) / 2 + 1));
2570786099deSNavdeep Parhar 		} else
2571786099deSNavdeep Parhar 			set_mbuf_eo_tsclk_tsoff(m0, 0);
2572786099deSNavdeep Parhar 	} else if (needs_udp_csum(m)) {
2573786099deSNavdeep Parhar 		m0->m_pkthdr.l4hlen = sizeof(struct udphdr);
2574786099deSNavdeep Parhar #endif
25756af45170SJohn Baldwin 	}
2576786099deSNavdeep Parhar #ifdef RATELIMIT
2577786099deSNavdeep Parhar 	if (needs_eo(m0)) {
2578786099deSNavdeep Parhar 		u_int immhdrs;
2579786099deSNavdeep Parhar 
2580786099deSNavdeep Parhar 		/* EO WRs have the headers in the WR and not the GL. */
2581786099deSNavdeep Parhar 		immhdrs = m0->m_pkthdr.l2hlen + m0->m_pkthdr.l3hlen +
2582786099deSNavdeep Parhar 		    m0->m_pkthdr.l4hlen;
2583786099deSNavdeep Parhar 		nsegs = count_mbuf_nsegs(m0, immhdrs);
2584786099deSNavdeep Parhar 		set_mbuf_eo_nsegs(m0, nsegs);
2585786099deSNavdeep Parhar 		set_mbuf_eo_len16(m0,
2586786099deSNavdeep Parhar 		    txpkt_eo_len16(nsegs, immhdrs, needs_tso(m0)));
2587786099deSNavdeep Parhar 	}
2588786099deSNavdeep Parhar #endif
25897951040fSNavdeep Parhar #endif
25907951040fSNavdeep Parhar 	MPASS(m0 == *mp);
25917951040fSNavdeep Parhar 	return (0);
25927951040fSNavdeep Parhar }
25937951040fSNavdeep Parhar 
25947951040fSNavdeep Parhar void *
25957951040fSNavdeep Parhar start_wrq_wr(struct sge_wrq *wrq, int len16, struct wrq_cookie *cookie)
25967951040fSNavdeep Parhar {
25977951040fSNavdeep Parhar 	struct sge_eq *eq = &wrq->eq;
25987951040fSNavdeep Parhar 	struct adapter *sc = wrq->adapter;
25997951040fSNavdeep Parhar 	int ndesc, available;
26007951040fSNavdeep Parhar 	struct wrqe *wr;
26017951040fSNavdeep Parhar 	void *w;
26027951040fSNavdeep Parhar 
26037951040fSNavdeep Parhar 	MPASS(len16 > 0);
26047951040fSNavdeep Parhar 	ndesc = howmany(len16, EQ_ESIZE / 16);
26057951040fSNavdeep Parhar 	MPASS(ndesc > 0 && ndesc <= SGE_MAX_WR_NDESC);
26067951040fSNavdeep Parhar 
26077951040fSNavdeep Parhar 	EQ_LOCK(eq);
26087951040fSNavdeep Parhar 
26098d6ae10aSNavdeep Parhar 	if (TAILQ_EMPTY(&wrq->incomplete_wrs) && !STAILQ_EMPTY(&wrq->wr_list))
26107951040fSNavdeep Parhar 		drain_wrq_wr_list(sc, wrq);
26117951040fSNavdeep Parhar 
26127951040fSNavdeep Parhar 	if (!STAILQ_EMPTY(&wrq->wr_list)) {
26137951040fSNavdeep Parhar slowpath:
26147951040fSNavdeep Parhar 		EQ_UNLOCK(eq);
26157951040fSNavdeep Parhar 		wr = alloc_wrqe(len16 * 16, wrq);
26167951040fSNavdeep Parhar 		if (__predict_false(wr == NULL))
26177951040fSNavdeep Parhar 			return (NULL);
26187951040fSNavdeep Parhar 		cookie->pidx = -1;
26197951040fSNavdeep Parhar 		cookie->ndesc = ndesc;
26207951040fSNavdeep Parhar 		return (&wr->wr);
26217951040fSNavdeep Parhar 	}
26227951040fSNavdeep Parhar 
26237951040fSNavdeep Parhar 	eq->cidx = read_hw_cidx(eq);
26247951040fSNavdeep Parhar 	if (eq->pidx == eq->cidx)
26257951040fSNavdeep Parhar 		available = eq->sidx - 1;
26267951040fSNavdeep Parhar 	else
26277951040fSNavdeep Parhar 		available = IDXDIFF(eq->cidx, eq->pidx, eq->sidx) - 1;
26287951040fSNavdeep Parhar 	if (available < ndesc)
26297951040fSNavdeep Parhar 		goto slowpath;
26307951040fSNavdeep Parhar 
26317951040fSNavdeep Parhar 	cookie->pidx = eq->pidx;
26327951040fSNavdeep Parhar 	cookie->ndesc = ndesc;
26337951040fSNavdeep Parhar 	TAILQ_INSERT_TAIL(&wrq->incomplete_wrs, cookie, link);
26347951040fSNavdeep Parhar 
26357951040fSNavdeep Parhar 	w = &eq->desc[eq->pidx];
26367951040fSNavdeep Parhar 	IDXINCR(eq->pidx, ndesc, eq->sidx);
2637f50c49ccSNavdeep Parhar 	if (__predict_false(cookie->pidx + ndesc > eq->sidx)) {
26387951040fSNavdeep Parhar 		w = &wrq->ss[0];
26397951040fSNavdeep Parhar 		wrq->ss_pidx = cookie->pidx;
26407951040fSNavdeep Parhar 		wrq->ss_len = len16 * 16;
26417951040fSNavdeep Parhar 	}
26427951040fSNavdeep Parhar 
26437951040fSNavdeep Parhar 	EQ_UNLOCK(eq);
26447951040fSNavdeep Parhar 
26457951040fSNavdeep Parhar 	return (w);
26467951040fSNavdeep Parhar }
26477951040fSNavdeep Parhar 
26487951040fSNavdeep Parhar void
26497951040fSNavdeep Parhar commit_wrq_wr(struct sge_wrq *wrq, void *w, struct wrq_cookie *cookie)
26507951040fSNavdeep Parhar {
26517951040fSNavdeep Parhar 	struct sge_eq *eq = &wrq->eq;
26527951040fSNavdeep Parhar 	struct adapter *sc = wrq->adapter;
26537951040fSNavdeep Parhar 	int ndesc, pidx;
26547951040fSNavdeep Parhar 	struct wrq_cookie *prev, *next;
26557951040fSNavdeep Parhar 
26567951040fSNavdeep Parhar 	if (cookie->pidx == -1) {
26577951040fSNavdeep Parhar 		struct wrqe *wr = __containerof(w, struct wrqe, wr);
26587951040fSNavdeep Parhar 
26597951040fSNavdeep Parhar 		t4_wrq_tx(sc, wr);
26607951040fSNavdeep Parhar 		return;
26617951040fSNavdeep Parhar 	}
26627951040fSNavdeep Parhar 
26637951040fSNavdeep Parhar 	if (__predict_false(w == &wrq->ss[0])) {
26647951040fSNavdeep Parhar 		int n = (eq->sidx - wrq->ss_pidx) * EQ_ESIZE;
26657951040fSNavdeep Parhar 
26667951040fSNavdeep Parhar 		MPASS(wrq->ss_len > n);	/* WR had better wrap around. */
26677951040fSNavdeep Parhar 		bcopy(&wrq->ss[0], &eq->desc[wrq->ss_pidx], n);
26687951040fSNavdeep Parhar 		bcopy(&wrq->ss[n], &eq->desc[0], wrq->ss_len - n);
26697951040fSNavdeep Parhar 		wrq->tx_wrs_ss++;
26707951040fSNavdeep Parhar 	} else
26717951040fSNavdeep Parhar 		wrq->tx_wrs_direct++;
26727951040fSNavdeep Parhar 
26737951040fSNavdeep Parhar 	EQ_LOCK(eq);
26748d6ae10aSNavdeep Parhar 	ndesc = cookie->ndesc;	/* Can be more than SGE_MAX_WR_NDESC here. */
26758d6ae10aSNavdeep Parhar 	pidx = cookie->pidx;
26768d6ae10aSNavdeep Parhar 	MPASS(pidx >= 0 && pidx < eq->sidx);
26777951040fSNavdeep Parhar 	prev = TAILQ_PREV(cookie, wrq_incomplete_wrs, link);
26787951040fSNavdeep Parhar 	next = TAILQ_NEXT(cookie, link);
26797951040fSNavdeep Parhar 	if (prev == NULL) {
26807951040fSNavdeep Parhar 		MPASS(pidx == eq->dbidx);
26812e09fe91SNavdeep Parhar 		if (next == NULL || ndesc >= 16) {
26822e09fe91SNavdeep Parhar 			int available;
26832e09fe91SNavdeep Parhar 			struct fw_eth_tx_pkt_wr *dst;	/* any fw WR struct will do */
26842e09fe91SNavdeep Parhar 
26852e09fe91SNavdeep Parhar 			/*
26862e09fe91SNavdeep Parhar 			 * Note that the WR via which we'll request tx updates
26872e09fe91SNavdeep Parhar 			 * is at pidx and not eq->pidx, which has moved on
26882e09fe91SNavdeep Parhar 			 * already.
26892e09fe91SNavdeep Parhar 			 */
26902e09fe91SNavdeep Parhar 			dst = (void *)&eq->desc[pidx];
26912e09fe91SNavdeep Parhar 			available = IDXDIFF(eq->cidx, eq->pidx, eq->sidx) - 1;
26922e09fe91SNavdeep Parhar 			if (available < eq->sidx / 4 &&
26932e09fe91SNavdeep Parhar 			    atomic_cmpset_int(&eq->equiq, 0, 1)) {
2694ddf09ad6SNavdeep Parhar 				/*
2695ddf09ad6SNavdeep Parhar 				 * XXX: This is not 100% reliable with some
2696ddf09ad6SNavdeep Parhar 				 * types of WRs.  But this is a very unusual
2697ddf09ad6SNavdeep Parhar 				 * situation for an ofld/ctrl queue anyway.
2698ddf09ad6SNavdeep Parhar 				 */
26992e09fe91SNavdeep Parhar 				dst->equiq_to_len16 |= htobe32(F_FW_WR_EQUIQ |
27002e09fe91SNavdeep Parhar 				    F_FW_WR_EQUEQ);
27012e09fe91SNavdeep Parhar 			}
27022e09fe91SNavdeep Parhar 
27037951040fSNavdeep Parhar 			ring_eq_db(wrq->adapter, eq, ndesc);
27042e09fe91SNavdeep Parhar 		} else {
27057951040fSNavdeep Parhar 			MPASS(IDXDIFF(next->pidx, pidx, eq->sidx) == ndesc);
27067951040fSNavdeep Parhar 			next->pidx = pidx;
27077951040fSNavdeep Parhar 			next->ndesc += ndesc;
27087951040fSNavdeep Parhar 		}
27097951040fSNavdeep Parhar 	} else {
27107951040fSNavdeep Parhar 		MPASS(IDXDIFF(pidx, prev->pidx, eq->sidx) == prev->ndesc);
27117951040fSNavdeep Parhar 		prev->ndesc += ndesc;
27127951040fSNavdeep Parhar 	}
27137951040fSNavdeep Parhar 	TAILQ_REMOVE(&wrq->incomplete_wrs, cookie, link);
27147951040fSNavdeep Parhar 
27157951040fSNavdeep Parhar 	if (TAILQ_EMPTY(&wrq->incomplete_wrs) && !STAILQ_EMPTY(&wrq->wr_list))
27167951040fSNavdeep Parhar 		drain_wrq_wr_list(sc, wrq);
27177951040fSNavdeep Parhar 
27187951040fSNavdeep Parhar #ifdef INVARIANTS
27197951040fSNavdeep Parhar 	if (TAILQ_EMPTY(&wrq->incomplete_wrs)) {
27207951040fSNavdeep Parhar 		/* Doorbell must have caught up to the pidx. */
27217951040fSNavdeep Parhar 		MPASS(wrq->eq.pidx == wrq->eq.dbidx);
27227951040fSNavdeep Parhar 	}
27237951040fSNavdeep Parhar #endif
27247951040fSNavdeep Parhar 	EQ_UNLOCK(eq);
27257951040fSNavdeep Parhar }
27267951040fSNavdeep Parhar 
27277951040fSNavdeep Parhar static u_int
27287951040fSNavdeep Parhar can_resume_eth_tx(struct mp_ring *r)
27297951040fSNavdeep Parhar {
27307951040fSNavdeep Parhar 	struct sge_eq *eq = r->cookie;
27317951040fSNavdeep Parhar 
27327951040fSNavdeep Parhar 	return (total_available_tx_desc(eq) > eq->sidx / 8);
27337951040fSNavdeep Parhar }
27347951040fSNavdeep Parhar 
27357951040fSNavdeep Parhar static inline int
27367951040fSNavdeep Parhar cannot_use_txpkts(struct mbuf *m)
27377951040fSNavdeep Parhar {
27387951040fSNavdeep Parhar 	/* maybe put a GL limit too, to avoid silliness? */
27397951040fSNavdeep Parhar 
2740*5cdaef71SJohn Baldwin 	return (needs_tso(m) || (mbuf_cflags(m) & MC_RAW_WR) != 0);
27417951040fSNavdeep Parhar }
27427951040fSNavdeep Parhar 
27431404daa7SNavdeep Parhar static inline int
27441404daa7SNavdeep Parhar discard_tx(struct sge_eq *eq)
27451404daa7SNavdeep Parhar {
27461404daa7SNavdeep Parhar 
27471404daa7SNavdeep Parhar 	return ((eq->flags & (EQ_ENABLED | EQ_QFLUSH)) != EQ_ENABLED);
27481404daa7SNavdeep Parhar }
27491404daa7SNavdeep Parhar 
2750*5cdaef71SJohn Baldwin static inline int
2751*5cdaef71SJohn Baldwin wr_can_update_eq(struct fw_eth_tx_pkts_wr *wr)
2752*5cdaef71SJohn Baldwin {
2753*5cdaef71SJohn Baldwin 
2754*5cdaef71SJohn Baldwin 	switch (G_FW_WR_OP(be32toh(wr->op_pkd))) {
2755*5cdaef71SJohn Baldwin 	case FW_ULPTX_WR:
2756*5cdaef71SJohn Baldwin 	case FW_ETH_TX_PKT_WR:
2757*5cdaef71SJohn Baldwin 	case FW_ETH_TX_PKTS_WR:
2758*5cdaef71SJohn Baldwin 	case FW_ETH_TX_PKT_VM_WR:
2759*5cdaef71SJohn Baldwin 		return (1);
2760*5cdaef71SJohn Baldwin 	default:
2761*5cdaef71SJohn Baldwin 		return (0);
2762*5cdaef71SJohn Baldwin 	}
2763*5cdaef71SJohn Baldwin }
2764*5cdaef71SJohn Baldwin 
27657951040fSNavdeep Parhar /*
27667951040fSNavdeep Parhar  * r->items[cidx] to r->items[pidx], with a wraparound at r->size, are ready to
27677951040fSNavdeep Parhar  * be consumed.  Return the actual number consumed.  0 indicates a stall.
27687951040fSNavdeep Parhar  */
27697951040fSNavdeep Parhar static u_int
27707951040fSNavdeep Parhar eth_tx(struct mp_ring *r, u_int cidx, u_int pidx)
27717951040fSNavdeep Parhar {
27727951040fSNavdeep Parhar 	struct sge_txq *txq = r->cookie;
27737951040fSNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
27747951040fSNavdeep Parhar 	struct ifnet *ifp = txq->ifp;
2775fe2ebb76SJohn Baldwin 	struct vi_info *vi = ifp->if_softc;
2776fe2ebb76SJohn Baldwin 	struct port_info *pi = vi->pi;
27777951040fSNavdeep Parhar 	struct adapter *sc = pi->adapter;
27787951040fSNavdeep Parhar 	u_int total, remaining;		/* # of packets */
27797951040fSNavdeep Parhar 	u_int available, dbdiff;	/* # of hardware descriptors */
27807951040fSNavdeep Parhar 	u_int n, next_cidx;
27817951040fSNavdeep Parhar 	struct mbuf *m0, *tail;
27827951040fSNavdeep Parhar 	struct txpkts txp;
27837951040fSNavdeep Parhar 	struct fw_eth_tx_pkts_wr *wr;	/* any fw WR struct will do */
27847951040fSNavdeep Parhar 
27857951040fSNavdeep Parhar 	remaining = IDXDIFF(pidx, cidx, r->size);
27867951040fSNavdeep Parhar 	MPASS(remaining > 0);	/* Must not be called without work to do. */
27877951040fSNavdeep Parhar 	total = 0;
27887951040fSNavdeep Parhar 
27897951040fSNavdeep Parhar 	TXQ_LOCK(txq);
27901404daa7SNavdeep Parhar 	if (__predict_false(discard_tx(eq))) {
27917951040fSNavdeep Parhar 		while (cidx != pidx) {
27927951040fSNavdeep Parhar 			m0 = r->items[cidx];
27937951040fSNavdeep Parhar 			m_freem(m0);
27947951040fSNavdeep Parhar 			if (++cidx == r->size)
27957951040fSNavdeep Parhar 				cidx = 0;
27967951040fSNavdeep Parhar 		}
27977951040fSNavdeep Parhar 		reclaim_tx_descs(txq, 2048);
27987951040fSNavdeep Parhar 		total = remaining;
27997951040fSNavdeep Parhar 		goto done;
28007951040fSNavdeep Parhar 	}
28017951040fSNavdeep Parhar 
28027951040fSNavdeep Parhar 	/* How many hardware descriptors do we have readily available. */
28037951040fSNavdeep Parhar 	if (eq->pidx == eq->cidx)
28047951040fSNavdeep Parhar 		available = eq->sidx - 1;
28057951040fSNavdeep Parhar 	else
28067951040fSNavdeep Parhar 		available = IDXDIFF(eq->cidx, eq->pidx, eq->sidx) - 1;
28077951040fSNavdeep Parhar 	dbdiff = IDXDIFF(eq->pidx, eq->dbidx, eq->sidx);
28087951040fSNavdeep Parhar 
28097951040fSNavdeep Parhar 	while (remaining > 0) {
28107951040fSNavdeep Parhar 
28117951040fSNavdeep Parhar 		m0 = r->items[cidx];
28127951040fSNavdeep Parhar 		M_ASSERTPKTHDR(m0);
28137951040fSNavdeep Parhar 		MPASS(m0->m_nextpkt == NULL);
28147951040fSNavdeep Parhar 
28157951040fSNavdeep Parhar 		if (available < SGE_MAX_WR_NDESC) {
28167951040fSNavdeep Parhar 			available += reclaim_tx_descs(txq, 64);
28177951040fSNavdeep Parhar 			if (available < howmany(mbuf_len16(m0), EQ_ESIZE / 16))
28187951040fSNavdeep Parhar 				break;	/* out of descriptors */
28197951040fSNavdeep Parhar 		}
28207951040fSNavdeep Parhar 
28217951040fSNavdeep Parhar 		next_cidx = cidx + 1;
28227951040fSNavdeep Parhar 		if (__predict_false(next_cidx == r->size))
28237951040fSNavdeep Parhar 			next_cidx = 0;
28247951040fSNavdeep Parhar 
28257951040fSNavdeep Parhar 		wr = (void *)&eq->desc[eq->pidx];
28266af45170SJohn Baldwin 		if (sc->flags & IS_VF) {
28276af45170SJohn Baldwin 			total++;
28286af45170SJohn Baldwin 			remaining--;
28296af45170SJohn Baldwin 			ETHER_BPF_MTAP(ifp, m0);
2830472a6004SNavdeep Parhar 			n = write_txpkt_vm_wr(sc, txq, (void *)wr, m0,
2831472a6004SNavdeep Parhar 			    available);
28326af45170SJohn Baldwin 		} else if (remaining > 1 &&
28337951040fSNavdeep Parhar 		    try_txpkts(m0, r->items[next_cidx], &txp, available) == 0) {
28347951040fSNavdeep Parhar 
28357951040fSNavdeep Parhar 			/* pkts at cidx, next_cidx should both be in txp. */
28367951040fSNavdeep Parhar 			MPASS(txp.npkt == 2);
28377951040fSNavdeep Parhar 			tail = r->items[next_cidx];
28387951040fSNavdeep Parhar 			MPASS(tail->m_nextpkt == NULL);
28397951040fSNavdeep Parhar 			ETHER_BPF_MTAP(ifp, m0);
28407951040fSNavdeep Parhar 			ETHER_BPF_MTAP(ifp, tail);
28417951040fSNavdeep Parhar 			m0->m_nextpkt = tail;
28427951040fSNavdeep Parhar 
28437951040fSNavdeep Parhar 			if (__predict_false(++next_cidx == r->size))
28447951040fSNavdeep Parhar 				next_cidx = 0;
28457951040fSNavdeep Parhar 
28467951040fSNavdeep Parhar 			while (next_cidx != pidx) {
28477951040fSNavdeep Parhar 				if (add_to_txpkts(r->items[next_cidx], &txp,
28487951040fSNavdeep Parhar 				    available) != 0)
28497951040fSNavdeep Parhar 					break;
28507951040fSNavdeep Parhar 				tail->m_nextpkt = r->items[next_cidx];
28517951040fSNavdeep Parhar 				tail = tail->m_nextpkt;
28527951040fSNavdeep Parhar 				ETHER_BPF_MTAP(ifp, tail);
28537951040fSNavdeep Parhar 				if (__predict_false(++next_cidx == r->size))
28547951040fSNavdeep Parhar 					next_cidx = 0;
28557951040fSNavdeep Parhar 			}
28567951040fSNavdeep Parhar 
28577951040fSNavdeep Parhar 			n = write_txpkts_wr(txq, wr, m0, &txp, available);
28587951040fSNavdeep Parhar 			total += txp.npkt;
28597951040fSNavdeep Parhar 			remaining -= txp.npkt;
2860*5cdaef71SJohn Baldwin 		} else if (mbuf_cflags(m0) & MC_RAW_WR) {
2861*5cdaef71SJohn Baldwin 			total++;
2862*5cdaef71SJohn Baldwin 			remaining--;
2863*5cdaef71SJohn Baldwin 			n = write_raw_wr(txq, (void *)wr, m0, available);
28647951040fSNavdeep Parhar 		} else {
28657951040fSNavdeep Parhar 			total++;
28667951040fSNavdeep Parhar 			remaining--;
28677951040fSNavdeep Parhar 			ETHER_BPF_MTAP(ifp, m0);
286878552b23SNavdeep Parhar 			n = write_txpkt_wr(txq, (void *)wr, m0, available);
28697951040fSNavdeep Parhar 		}
28707951040fSNavdeep Parhar 		MPASS(n >= 1 && n <= available && n <= SGE_MAX_WR_NDESC);
28717951040fSNavdeep Parhar 
28727951040fSNavdeep Parhar 		available -= n;
28737951040fSNavdeep Parhar 		dbdiff += n;
28747951040fSNavdeep Parhar 		IDXINCR(eq->pidx, n, eq->sidx);
28757951040fSNavdeep Parhar 
2876*5cdaef71SJohn Baldwin 		if (wr_can_update_eq(wr)) {
28777951040fSNavdeep Parhar 			if (total_available_tx_desc(eq) < eq->sidx / 4 &&
28787951040fSNavdeep Parhar 			    atomic_cmpset_int(&eq->equiq, 0, 1)) {
28797951040fSNavdeep Parhar 				wr->equiq_to_len16 |= htobe32(F_FW_WR_EQUIQ |
28807951040fSNavdeep Parhar 				    F_FW_WR_EQUEQ);
28817951040fSNavdeep Parhar 				eq->equeqidx = eq->pidx;
2882*5cdaef71SJohn Baldwin 			} else if (IDXDIFF(eq->pidx, eq->equeqidx, eq->sidx) >=
2883*5cdaef71SJohn Baldwin 			    32) {
28847951040fSNavdeep Parhar 				wr->equiq_to_len16 |= htobe32(F_FW_WR_EQUEQ);
28857951040fSNavdeep Parhar 				eq->equeqidx = eq->pidx;
28867951040fSNavdeep Parhar 			}
2887*5cdaef71SJohn Baldwin 		}
28887951040fSNavdeep Parhar 
28897951040fSNavdeep Parhar 		if (dbdiff >= 16 && remaining >= 4) {
28907951040fSNavdeep Parhar 			ring_eq_db(sc, eq, dbdiff);
28917951040fSNavdeep Parhar 			available += reclaim_tx_descs(txq, 4 * dbdiff);
28927951040fSNavdeep Parhar 			dbdiff = 0;
28937951040fSNavdeep Parhar 		}
28947951040fSNavdeep Parhar 
28957951040fSNavdeep Parhar 		cidx = next_cidx;
28967951040fSNavdeep Parhar 	}
28977951040fSNavdeep Parhar 	if (dbdiff != 0) {
28987951040fSNavdeep Parhar 		ring_eq_db(sc, eq, dbdiff);
28997951040fSNavdeep Parhar 		reclaim_tx_descs(txq, 32);
29007951040fSNavdeep Parhar 	}
29017951040fSNavdeep Parhar done:
29027951040fSNavdeep Parhar 	TXQ_UNLOCK(txq);
29037951040fSNavdeep Parhar 
29047951040fSNavdeep Parhar 	return (total);
2905733b9277SNavdeep Parhar }
2906733b9277SNavdeep Parhar 
290754e4ee71SNavdeep Parhar static inline void
290854e4ee71SNavdeep Parhar init_iq(struct sge_iq *iq, struct adapter *sc, int tmr_idx, int pktc_idx,
2909b2daa9a9SNavdeep Parhar     int qsize)
291054e4ee71SNavdeep Parhar {
2911b2daa9a9SNavdeep Parhar 
291254e4ee71SNavdeep Parhar 	KASSERT(tmr_idx >= 0 && tmr_idx < SGE_NTIMERS,
291354e4ee71SNavdeep Parhar 	    ("%s: bad tmr_idx %d", __func__, tmr_idx));
291454e4ee71SNavdeep Parhar 	KASSERT(pktc_idx < SGE_NCOUNTERS,	/* -ve is ok, means don't use */
291554e4ee71SNavdeep Parhar 	    ("%s: bad pktc_idx %d", __func__, pktc_idx));
291654e4ee71SNavdeep Parhar 
291754e4ee71SNavdeep Parhar 	iq->flags = 0;
291854e4ee71SNavdeep Parhar 	iq->adapter = sc;
29197a32954cSNavdeep Parhar 	iq->intr_params = V_QINTR_TIMER_IDX(tmr_idx);
29207a32954cSNavdeep Parhar 	iq->intr_pktc_idx = SGE_NCOUNTERS - 1;
29217a32954cSNavdeep Parhar 	if (pktc_idx >= 0) {
29227a32954cSNavdeep Parhar 		iq->intr_params |= F_QINTR_CNT_EN;
292354e4ee71SNavdeep Parhar 		iq->intr_pktc_idx = pktc_idx;
29247a32954cSNavdeep Parhar 	}
2925d14b0ac1SNavdeep Parhar 	iq->qsize = roundup2(qsize, 16);	/* See FW_IQ_CMD/iqsize */
292690e7434aSNavdeep Parhar 	iq->sidx = iq->qsize - sc->params.sge.spg_len / IQ_ESIZE;
292754e4ee71SNavdeep Parhar }
292854e4ee71SNavdeep Parhar 
292954e4ee71SNavdeep Parhar static inline void
2930e3207e19SNavdeep Parhar init_fl(struct adapter *sc, struct sge_fl *fl, int qsize, int maxp, char *name)
293154e4ee71SNavdeep Parhar {
29321458bff9SNavdeep Parhar 
293354e4ee71SNavdeep Parhar 	fl->qsize = qsize;
293490e7434aSNavdeep Parhar 	fl->sidx = qsize - sc->params.sge.spg_len / EQ_ESIZE;
293554e4ee71SNavdeep Parhar 	strlcpy(fl->lockname, name, sizeof(fl->lockname));
2936e3207e19SNavdeep Parhar 	if (sc->flags & BUF_PACKING_OK &&
2937e3207e19SNavdeep Parhar 	    ((!is_t4(sc) && buffer_packing) ||	/* T5+: enabled unless 0 */
2938e3207e19SNavdeep Parhar 	    (is_t4(sc) && buffer_packing == 1)))/* T4: disabled unless 1 */
29391458bff9SNavdeep Parhar 		fl->flags |= FL_BUF_PACKING;
294038035ed6SNavdeep Parhar 	find_best_refill_source(sc, fl, maxp);
294138035ed6SNavdeep Parhar 	find_safe_refill_source(sc, fl);
294254e4ee71SNavdeep Parhar }
294354e4ee71SNavdeep Parhar 
294454e4ee71SNavdeep Parhar static inline void
294590e7434aSNavdeep Parhar init_eq(struct adapter *sc, struct sge_eq *eq, int eqtype, int qsize,
294690e7434aSNavdeep Parhar     uint8_t tx_chan, uint16_t iqid, char *name)
294754e4ee71SNavdeep Parhar {
2948733b9277SNavdeep Parhar 	KASSERT(eqtype <= EQ_TYPEMASK, ("%s: bad qtype %d", __func__, eqtype));
2949733b9277SNavdeep Parhar 
2950733b9277SNavdeep Parhar 	eq->flags = eqtype & EQ_TYPEMASK;
2951733b9277SNavdeep Parhar 	eq->tx_chan = tx_chan;
2952733b9277SNavdeep Parhar 	eq->iqid = iqid;
295390e7434aSNavdeep Parhar 	eq->sidx = qsize - sc->params.sge.spg_len / EQ_ESIZE;
2954f7dfe243SNavdeep Parhar 	strlcpy(eq->lockname, name, sizeof(eq->lockname));
295554e4ee71SNavdeep Parhar }
295654e4ee71SNavdeep Parhar 
295754e4ee71SNavdeep Parhar static int
295854e4ee71SNavdeep Parhar alloc_ring(struct adapter *sc, size_t len, bus_dma_tag_t *tag,
295954e4ee71SNavdeep Parhar     bus_dmamap_t *map, bus_addr_t *pa, void **va)
296054e4ee71SNavdeep Parhar {
296154e4ee71SNavdeep Parhar 	int rc;
296254e4ee71SNavdeep Parhar 
296354e4ee71SNavdeep Parhar 	rc = bus_dma_tag_create(sc->dmat, 512, 0, BUS_SPACE_MAXADDR,
296454e4ee71SNavdeep Parhar 	    BUS_SPACE_MAXADDR, NULL, NULL, len, 1, len, 0, NULL, NULL, tag);
296554e4ee71SNavdeep Parhar 	if (rc != 0) {
296654e4ee71SNavdeep Parhar 		device_printf(sc->dev, "cannot allocate DMA tag: %d\n", rc);
296754e4ee71SNavdeep Parhar 		goto done;
296854e4ee71SNavdeep Parhar 	}
296954e4ee71SNavdeep Parhar 
297054e4ee71SNavdeep Parhar 	rc = bus_dmamem_alloc(*tag, va,
297154e4ee71SNavdeep Parhar 	    BUS_DMA_WAITOK | BUS_DMA_COHERENT | BUS_DMA_ZERO, map);
297254e4ee71SNavdeep Parhar 	if (rc != 0) {
297354e4ee71SNavdeep Parhar 		device_printf(sc->dev, "cannot allocate DMA memory: %d\n", rc);
297454e4ee71SNavdeep Parhar 		goto done;
297554e4ee71SNavdeep Parhar 	}
297654e4ee71SNavdeep Parhar 
297754e4ee71SNavdeep Parhar 	rc = bus_dmamap_load(*tag, *map, *va, len, oneseg_dma_callback, pa, 0);
297854e4ee71SNavdeep Parhar 	if (rc != 0) {
297954e4ee71SNavdeep Parhar 		device_printf(sc->dev, "cannot load DMA map: %d\n", rc);
298054e4ee71SNavdeep Parhar 		goto done;
298154e4ee71SNavdeep Parhar 	}
298254e4ee71SNavdeep Parhar done:
298354e4ee71SNavdeep Parhar 	if (rc)
298454e4ee71SNavdeep Parhar 		free_ring(sc, *tag, *map, *pa, *va);
298554e4ee71SNavdeep Parhar 
298654e4ee71SNavdeep Parhar 	return (rc);
298754e4ee71SNavdeep Parhar }
298854e4ee71SNavdeep Parhar 
298954e4ee71SNavdeep Parhar static int
299054e4ee71SNavdeep Parhar free_ring(struct adapter *sc, bus_dma_tag_t tag, bus_dmamap_t map,
299154e4ee71SNavdeep Parhar     bus_addr_t pa, void *va)
299254e4ee71SNavdeep Parhar {
299354e4ee71SNavdeep Parhar 	if (pa)
299454e4ee71SNavdeep Parhar 		bus_dmamap_unload(tag, map);
299554e4ee71SNavdeep Parhar 	if (va)
299654e4ee71SNavdeep Parhar 		bus_dmamem_free(tag, va, map);
299754e4ee71SNavdeep Parhar 	if (tag)
299854e4ee71SNavdeep Parhar 		bus_dma_tag_destroy(tag);
299954e4ee71SNavdeep Parhar 
300054e4ee71SNavdeep Parhar 	return (0);
300154e4ee71SNavdeep Parhar }
300254e4ee71SNavdeep Parhar 
300354e4ee71SNavdeep Parhar /*
300454e4ee71SNavdeep Parhar  * Allocates the ring for an ingress queue and an optional freelist.  If the
300554e4ee71SNavdeep Parhar  * freelist is specified it will be allocated and then associated with the
300654e4ee71SNavdeep Parhar  * ingress queue.
300754e4ee71SNavdeep Parhar  *
300854e4ee71SNavdeep Parhar  * Returns errno on failure.  Resources allocated up to that point may still be
300954e4ee71SNavdeep Parhar  * allocated.  Caller is responsible for cleanup in case this function fails.
301054e4ee71SNavdeep Parhar  *
3011f549e352SNavdeep Parhar  * If the ingress queue will take interrupts directly then the intr_idx
3012f549e352SNavdeep Parhar  * specifies the vector, starting from 0.  -1 means the interrupts for this
3013f549e352SNavdeep Parhar  * queue should be forwarded to the fwq.
301454e4ee71SNavdeep Parhar  */
301554e4ee71SNavdeep Parhar static int
3016fe2ebb76SJohn Baldwin alloc_iq_fl(struct vi_info *vi, struct sge_iq *iq, struct sge_fl *fl,
3017bc14b14dSNavdeep Parhar     int intr_idx, int cong)
301854e4ee71SNavdeep Parhar {
301954e4ee71SNavdeep Parhar 	int rc, i, cntxt_id;
302054e4ee71SNavdeep Parhar 	size_t len;
302154e4ee71SNavdeep Parhar 	struct fw_iq_cmd c;
3022fe2ebb76SJohn Baldwin 	struct port_info *pi = vi->pi;
302354e4ee71SNavdeep Parhar 	struct adapter *sc = iq->adapter;
302490e7434aSNavdeep Parhar 	struct sge_params *sp = &sc->params.sge;
302554e4ee71SNavdeep Parhar 	__be32 v = 0;
302654e4ee71SNavdeep Parhar 
3027b2daa9a9SNavdeep Parhar 	len = iq->qsize * IQ_ESIZE;
302854e4ee71SNavdeep Parhar 	rc = alloc_ring(sc, len, &iq->desc_tag, &iq->desc_map, &iq->ba,
302954e4ee71SNavdeep Parhar 	    (void **)&iq->desc);
303054e4ee71SNavdeep Parhar 	if (rc != 0)
303154e4ee71SNavdeep Parhar 		return (rc);
303254e4ee71SNavdeep Parhar 
303354e4ee71SNavdeep Parhar 	bzero(&c, sizeof(c));
303454e4ee71SNavdeep Parhar 	c.op_to_vfn = htobe32(V_FW_CMD_OP(FW_IQ_CMD) | F_FW_CMD_REQUEST |
303554e4ee71SNavdeep Parhar 	    F_FW_CMD_WRITE | F_FW_CMD_EXEC | V_FW_IQ_CMD_PFN(sc->pf) |
303654e4ee71SNavdeep Parhar 	    V_FW_IQ_CMD_VFN(0));
303754e4ee71SNavdeep Parhar 
303854e4ee71SNavdeep Parhar 	c.alloc_to_len16 = htobe32(F_FW_IQ_CMD_ALLOC | F_FW_IQ_CMD_IQSTART |
303954e4ee71SNavdeep Parhar 	    FW_LEN16(c));
304054e4ee71SNavdeep Parhar 
304154e4ee71SNavdeep Parhar 	/* Special handling for firmware event queue */
304254e4ee71SNavdeep Parhar 	if (iq == &sc->sge.fwq)
304354e4ee71SNavdeep Parhar 		v |= F_FW_IQ_CMD_IQASYNCH;
304454e4ee71SNavdeep Parhar 
3045f549e352SNavdeep Parhar 	if (intr_idx < 0) {
3046f549e352SNavdeep Parhar 		/* Forwarded interrupts, all headed to fwq */
3047f549e352SNavdeep Parhar 		v |= F_FW_IQ_CMD_IQANDST;
3048f549e352SNavdeep Parhar 		v |= V_FW_IQ_CMD_IQANDSTINDEX(sc->sge.fwq.cntxt_id);
3049f549e352SNavdeep Parhar 	} else {
305054e4ee71SNavdeep Parhar 		KASSERT(intr_idx < sc->intr_count,
305154e4ee71SNavdeep Parhar 		    ("%s: invalid direct intr_idx %d", __func__, intr_idx));
305254e4ee71SNavdeep Parhar 		v |= V_FW_IQ_CMD_IQANDSTINDEX(intr_idx);
3053f549e352SNavdeep Parhar 	}
305454e4ee71SNavdeep Parhar 
305554e4ee71SNavdeep Parhar 	c.type_to_iqandstindex = htobe32(v |
305654e4ee71SNavdeep Parhar 	    V_FW_IQ_CMD_TYPE(FW_IQ_TYPE_FL_INT_CAP) |
3057fe2ebb76SJohn Baldwin 	    V_FW_IQ_CMD_VIID(vi->viid) |
305854e4ee71SNavdeep Parhar 	    V_FW_IQ_CMD_IQANUD(X_UPDATEDELIVERY_INTERRUPT));
305954e4ee71SNavdeep Parhar 	c.iqdroprss_to_iqesize = htobe16(V_FW_IQ_CMD_IQPCIECH(pi->tx_chan) |
306054e4ee71SNavdeep Parhar 	    F_FW_IQ_CMD_IQGTSMODE |
306154e4ee71SNavdeep Parhar 	    V_FW_IQ_CMD_IQINTCNTTHRESH(iq->intr_pktc_idx) |
3062b2daa9a9SNavdeep Parhar 	    V_FW_IQ_CMD_IQESIZE(ilog2(IQ_ESIZE) - 4));
306354e4ee71SNavdeep Parhar 	c.iqsize = htobe16(iq->qsize);
306454e4ee71SNavdeep Parhar 	c.iqaddr = htobe64(iq->ba);
3065bc14b14dSNavdeep Parhar 	if (cong >= 0)
3066bc14b14dSNavdeep Parhar 		c.iqns_to_fl0congen = htobe32(F_FW_IQ_CMD_IQFLINTCONGEN);
306754e4ee71SNavdeep Parhar 
306854e4ee71SNavdeep Parhar 	if (fl) {
306954e4ee71SNavdeep Parhar 		mtx_init(&fl->fl_lock, fl->lockname, NULL, MTX_DEF);
307054e4ee71SNavdeep Parhar 
3071b2daa9a9SNavdeep Parhar 		len = fl->qsize * EQ_ESIZE;
307254e4ee71SNavdeep Parhar 		rc = alloc_ring(sc, len, &fl->desc_tag, &fl->desc_map,
307354e4ee71SNavdeep Parhar 		    &fl->ba, (void **)&fl->desc);
307454e4ee71SNavdeep Parhar 		if (rc)
307554e4ee71SNavdeep Parhar 			return (rc);
307654e4ee71SNavdeep Parhar 
307754e4ee71SNavdeep Parhar 		/* Allocate space for one software descriptor per buffer. */
307854e4ee71SNavdeep Parhar 		rc = alloc_fl_sdesc(fl);
307954e4ee71SNavdeep Parhar 		if (rc != 0) {
308054e4ee71SNavdeep Parhar 			device_printf(sc->dev,
308154e4ee71SNavdeep Parhar 			    "failed to setup fl software descriptors: %d\n",
308254e4ee71SNavdeep Parhar 			    rc);
308354e4ee71SNavdeep Parhar 			return (rc);
308454e4ee71SNavdeep Parhar 		}
30854d6db4e0SNavdeep Parhar 
30864d6db4e0SNavdeep Parhar 		if (fl->flags & FL_BUF_PACKING) {
308790e7434aSNavdeep Parhar 			fl->lowat = roundup2(sp->fl_starve_threshold2, 8);
308890e7434aSNavdeep Parhar 			fl->buf_boundary = sp->pack_boundary;
30894d6db4e0SNavdeep Parhar 		} else {
309090e7434aSNavdeep Parhar 			fl->lowat = roundup2(sp->fl_starve_threshold, 8);
3091e3207e19SNavdeep Parhar 			fl->buf_boundary = 16;
30924d6db4e0SNavdeep Parhar 		}
309390e7434aSNavdeep Parhar 		if (fl_pad && fl->buf_boundary < sp->pad_boundary)
309490e7434aSNavdeep Parhar 			fl->buf_boundary = sp->pad_boundary;
309554e4ee71SNavdeep Parhar 
3096214c3582SNavdeep Parhar 		c.iqns_to_fl0congen |=
3097bc14b14dSNavdeep Parhar 		    htobe32(V_FW_IQ_CMD_FL0HOSTFCMODE(X_HOSTFCMODE_NONE) |
3098bc14b14dSNavdeep Parhar 			F_FW_IQ_CMD_FL0FETCHRO | F_FW_IQ_CMD_FL0DATARO |
30991458bff9SNavdeep Parhar 			(fl_pad ? F_FW_IQ_CMD_FL0PADEN : 0) |
31001458bff9SNavdeep Parhar 			(fl->flags & FL_BUF_PACKING ? F_FW_IQ_CMD_FL0PACKEN :
31011458bff9SNavdeep Parhar 			    0));
3102bc14b14dSNavdeep Parhar 		if (cong >= 0) {
3103bc14b14dSNavdeep Parhar 			c.iqns_to_fl0congen |=
3104bc14b14dSNavdeep Parhar 				htobe32(V_FW_IQ_CMD_FL0CNGCHMAP(cong) |
3105bc14b14dSNavdeep Parhar 				    F_FW_IQ_CMD_FL0CONGCIF |
3106bc14b14dSNavdeep Parhar 				    F_FW_IQ_CMD_FL0CONGEN);
3107bc14b14dSNavdeep Parhar 		}
310854e4ee71SNavdeep Parhar 		c.fl0dcaen_to_fl0cidxfthresh =
3109ed7e5640SNavdeep Parhar 		    htobe16(V_FW_IQ_CMD_FL0FBMIN(chip_id(sc) <= CHELSIO_T5 ?
3110ed7e5640SNavdeep Parhar 			X_FETCHBURSTMIN_128B : X_FETCHBURSTMIN_64B) |
3111ed7e5640SNavdeep Parhar 			V_FW_IQ_CMD_FL0FBMAX(chip_id(sc) <= CHELSIO_T5 ?
3112ed7e5640SNavdeep Parhar 			X_FETCHBURSTMAX_512B : X_FETCHBURSTMAX_256B));
311354e4ee71SNavdeep Parhar 		c.fl0size = htobe16(fl->qsize);
311454e4ee71SNavdeep Parhar 		c.fl0addr = htobe64(fl->ba);
311554e4ee71SNavdeep Parhar 	}
311654e4ee71SNavdeep Parhar 
311754e4ee71SNavdeep Parhar 	rc = -t4_wr_mbox(sc, sc->mbox, &c, sizeof(c), &c);
311854e4ee71SNavdeep Parhar 	if (rc != 0) {
311954e4ee71SNavdeep Parhar 		device_printf(sc->dev,
312054e4ee71SNavdeep Parhar 		    "failed to create ingress queue: %d\n", rc);
312154e4ee71SNavdeep Parhar 		return (rc);
312254e4ee71SNavdeep Parhar 	}
312354e4ee71SNavdeep Parhar 
312454e4ee71SNavdeep Parhar 	iq->cidx = 0;
3125b2daa9a9SNavdeep Parhar 	iq->gen = F_RSPD_GEN;
312654e4ee71SNavdeep Parhar 	iq->intr_next = iq->intr_params;
312754e4ee71SNavdeep Parhar 	iq->cntxt_id = be16toh(c.iqid);
312854e4ee71SNavdeep Parhar 	iq->abs_id = be16toh(c.physiqid);
3129733b9277SNavdeep Parhar 	iq->flags |= IQ_ALLOCATED;
313054e4ee71SNavdeep Parhar 
313154e4ee71SNavdeep Parhar 	cntxt_id = iq->cntxt_id - sc->sge.iq_start;
3132733b9277SNavdeep Parhar 	if (cntxt_id >= sc->sge.niq) {
3133733b9277SNavdeep Parhar 		panic ("%s: iq->cntxt_id (%d) more than the max (%d)", __func__,
3134733b9277SNavdeep Parhar 		    cntxt_id, sc->sge.niq - 1);
3135733b9277SNavdeep Parhar 	}
313654e4ee71SNavdeep Parhar 	sc->sge.iqmap[cntxt_id] = iq;
313754e4ee71SNavdeep Parhar 
313854e4ee71SNavdeep Parhar 	if (fl) {
31394d6db4e0SNavdeep Parhar 		u_int qid;
31404d6db4e0SNavdeep Parhar 
31414d6db4e0SNavdeep Parhar 		iq->flags |= IQ_HAS_FL;
314254e4ee71SNavdeep Parhar 		fl->cntxt_id = be16toh(c.fl0id);
314354e4ee71SNavdeep Parhar 		fl->pidx = fl->cidx = 0;
314454e4ee71SNavdeep Parhar 
31459f1f7ec9SNavdeep Parhar 		cntxt_id = fl->cntxt_id - sc->sge.eq_start;
3146733b9277SNavdeep Parhar 		if (cntxt_id >= sc->sge.neq) {
3147733b9277SNavdeep Parhar 			panic("%s: fl->cntxt_id (%d) more than the max (%d)",
3148733b9277SNavdeep Parhar 			    __func__, cntxt_id, sc->sge.neq - 1);
3149733b9277SNavdeep Parhar 		}
315054e4ee71SNavdeep Parhar 		sc->sge.eqmap[cntxt_id] = (void *)fl;
315154e4ee71SNavdeep Parhar 
31524d6db4e0SNavdeep Parhar 		qid = fl->cntxt_id;
31534d6db4e0SNavdeep Parhar 		if (isset(&sc->doorbells, DOORBELL_UDB)) {
315490e7434aSNavdeep Parhar 			uint32_t s_qpp = sc->params.sge.eq_s_qpp;
31554d6db4e0SNavdeep Parhar 			uint32_t mask = (1 << s_qpp) - 1;
31564d6db4e0SNavdeep Parhar 			volatile uint8_t *udb;
31574d6db4e0SNavdeep Parhar 
31584d6db4e0SNavdeep Parhar 			udb = sc->udbs_base + UDBS_DB_OFFSET;
31594d6db4e0SNavdeep Parhar 			udb += (qid >> s_qpp) << PAGE_SHIFT;
31604d6db4e0SNavdeep Parhar 			qid &= mask;
31614d6db4e0SNavdeep Parhar 			if (qid < PAGE_SIZE / UDBS_SEG_SIZE) {
31624d6db4e0SNavdeep Parhar 				udb += qid << UDBS_SEG_SHIFT;
31634d6db4e0SNavdeep Parhar 				qid = 0;
31644d6db4e0SNavdeep Parhar 			}
31654d6db4e0SNavdeep Parhar 			fl->udb = (volatile void *)udb;
31664d6db4e0SNavdeep Parhar 		}
3167d1205d09SNavdeep Parhar 		fl->dbval = V_QID(qid) | sc->chip_params->sge_fl_db;
31684d6db4e0SNavdeep Parhar 
316954e4ee71SNavdeep Parhar 		FL_LOCK(fl);
3170733b9277SNavdeep Parhar 		/* Enough to make sure the SGE doesn't think it's starved */
3171733b9277SNavdeep Parhar 		refill_fl(sc, fl, fl->lowat);
317254e4ee71SNavdeep Parhar 		FL_UNLOCK(fl);
317354e4ee71SNavdeep Parhar 	}
317454e4ee71SNavdeep Parhar 
31758c0ca00bSNavdeep Parhar 	if (chip_id(sc) >= CHELSIO_T5 && !(sc->flags & IS_VF) && cong >= 0) {
3176ba41ec48SNavdeep Parhar 		uint32_t param, val;
3177ba41ec48SNavdeep Parhar 
3178ba41ec48SNavdeep Parhar 		param = V_FW_PARAMS_MNEM(FW_PARAMS_MNEM_DMAQ) |
3179ba41ec48SNavdeep Parhar 		    V_FW_PARAMS_PARAM_X(FW_PARAMS_PARAM_DMAQ_CONM_CTXT) |
3180ba41ec48SNavdeep Parhar 		    V_FW_PARAMS_PARAM_YZ(iq->cntxt_id);
318173cd9220SNavdeep Parhar 		if (cong == 0)
318273cd9220SNavdeep Parhar 			val = 1 << 19;
318373cd9220SNavdeep Parhar 		else {
318473cd9220SNavdeep Parhar 			val = 2 << 19;
318573cd9220SNavdeep Parhar 			for (i = 0; i < 4; i++) {
318673cd9220SNavdeep Parhar 				if (cong & (1 << i))
318773cd9220SNavdeep Parhar 					val |= 1 << (i << 2);
318873cd9220SNavdeep Parhar 			}
318973cd9220SNavdeep Parhar 		}
319073cd9220SNavdeep Parhar 
3191ba41ec48SNavdeep Parhar 		rc = -t4_set_params(sc, sc->mbox, sc->pf, 0, 1, &param, &val);
3192ba41ec48SNavdeep Parhar 		if (rc != 0) {
3193ba41ec48SNavdeep Parhar 			/* report error but carry on */
3194ba41ec48SNavdeep Parhar 			device_printf(sc->dev,
3195ba41ec48SNavdeep Parhar 			    "failed to set congestion manager context for "
3196ba41ec48SNavdeep Parhar 			    "ingress queue %d: %d\n", iq->cntxt_id, rc);
3197ba41ec48SNavdeep Parhar 		}
3198ba41ec48SNavdeep Parhar 	}
3199ba41ec48SNavdeep Parhar 
320054e4ee71SNavdeep Parhar 	/* Enable IQ interrupts */
3201733b9277SNavdeep Parhar 	atomic_store_rel_int(&iq->state, IQS_IDLE);
3202315048f2SJohn Baldwin 	t4_write_reg(sc, sc->sge_gts_reg, V_SEINTARM(iq->intr_params) |
320354e4ee71SNavdeep Parhar 	    V_INGRESSQID(iq->cntxt_id));
320454e4ee71SNavdeep Parhar 
320554e4ee71SNavdeep Parhar 	return (0);
320654e4ee71SNavdeep Parhar }
320754e4ee71SNavdeep Parhar 
320854e4ee71SNavdeep Parhar static int
3209fe2ebb76SJohn Baldwin free_iq_fl(struct vi_info *vi, struct sge_iq *iq, struct sge_fl *fl)
321054e4ee71SNavdeep Parhar {
321138035ed6SNavdeep Parhar 	int rc;
321254e4ee71SNavdeep Parhar 	struct adapter *sc = iq->adapter;
321354e4ee71SNavdeep Parhar 	device_t dev;
321454e4ee71SNavdeep Parhar 
321554e4ee71SNavdeep Parhar 	if (sc == NULL)
321654e4ee71SNavdeep Parhar 		return (0);	/* nothing to do */
321754e4ee71SNavdeep Parhar 
3218fe2ebb76SJohn Baldwin 	dev = vi ? vi->dev : sc->dev;
321954e4ee71SNavdeep Parhar 
322054e4ee71SNavdeep Parhar 	if (iq->flags & IQ_ALLOCATED) {
322154e4ee71SNavdeep Parhar 		rc = -t4_iq_free(sc, sc->mbox, sc->pf, 0,
322254e4ee71SNavdeep Parhar 		    FW_IQ_TYPE_FL_INT_CAP, iq->cntxt_id,
322354e4ee71SNavdeep Parhar 		    fl ? fl->cntxt_id : 0xffff, 0xffff);
322454e4ee71SNavdeep Parhar 		if (rc != 0) {
322554e4ee71SNavdeep Parhar 			device_printf(dev,
322654e4ee71SNavdeep Parhar 			    "failed to free queue %p: %d\n", iq, rc);
322754e4ee71SNavdeep Parhar 			return (rc);
322854e4ee71SNavdeep Parhar 		}
322954e4ee71SNavdeep Parhar 		iq->flags &= ~IQ_ALLOCATED;
323054e4ee71SNavdeep Parhar 	}
323154e4ee71SNavdeep Parhar 
323254e4ee71SNavdeep Parhar 	free_ring(sc, iq->desc_tag, iq->desc_map, iq->ba, iq->desc);
323354e4ee71SNavdeep Parhar 
323454e4ee71SNavdeep Parhar 	bzero(iq, sizeof(*iq));
323554e4ee71SNavdeep Parhar 
323654e4ee71SNavdeep Parhar 	if (fl) {
323754e4ee71SNavdeep Parhar 		free_ring(sc, fl->desc_tag, fl->desc_map, fl->ba,
323854e4ee71SNavdeep Parhar 		    fl->desc);
323954e4ee71SNavdeep Parhar 
3240aa9a5cc0SNavdeep Parhar 		if (fl->sdesc)
32411458bff9SNavdeep Parhar 			free_fl_sdesc(sc, fl);
32421458bff9SNavdeep Parhar 
324354e4ee71SNavdeep Parhar 		if (mtx_initialized(&fl->fl_lock))
324454e4ee71SNavdeep Parhar 			mtx_destroy(&fl->fl_lock);
324554e4ee71SNavdeep Parhar 
324654e4ee71SNavdeep Parhar 		bzero(fl, sizeof(*fl));
324754e4ee71SNavdeep Parhar 	}
324854e4ee71SNavdeep Parhar 
324954e4ee71SNavdeep Parhar 	return (0);
325054e4ee71SNavdeep Parhar }
325154e4ee71SNavdeep Parhar 
325238035ed6SNavdeep Parhar static void
3253348694daSNavdeep Parhar add_iq_sysctls(struct sysctl_ctx_list *ctx, struct sysctl_oid *oid,
3254348694daSNavdeep Parhar     struct sge_iq *iq)
3255348694daSNavdeep Parhar {
3256348694daSNavdeep Parhar 	struct sysctl_oid_list *children = SYSCTL_CHILDREN(oid);
3257348694daSNavdeep Parhar 
3258348694daSNavdeep Parhar 	SYSCTL_ADD_UAUTO(ctx, children, OID_AUTO, "ba", CTLFLAG_RD, &iq->ba,
3259348694daSNavdeep Parhar 	    "bus address of descriptor ring");
3260348694daSNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "dmalen", CTLFLAG_RD, NULL,
3261348694daSNavdeep Parhar 	    iq->qsize * IQ_ESIZE, "descriptor ring size in bytes");
3262348694daSNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "abs_id",
3263348694daSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &iq->abs_id, 0, sysctl_uint16, "I",
3264348694daSNavdeep Parhar 	    "absolute id of the queue");
3265348694daSNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "cntxt_id",
3266348694daSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &iq->cntxt_id, 0, sysctl_uint16, "I",
3267348694daSNavdeep Parhar 	    "SGE context id of the queue");
3268348694daSNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "cidx",
3269348694daSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &iq->cidx, 0, sysctl_uint16, "I",
3270348694daSNavdeep Parhar 	    "consumer index");
3271348694daSNavdeep Parhar }
3272348694daSNavdeep Parhar 
3273348694daSNavdeep Parhar static void
3274aa93b99aSNavdeep Parhar add_fl_sysctls(struct adapter *sc, struct sysctl_ctx_list *ctx,
3275aa93b99aSNavdeep Parhar     struct sysctl_oid *oid, struct sge_fl *fl)
327638035ed6SNavdeep Parhar {
327738035ed6SNavdeep Parhar 	struct sysctl_oid_list *children = SYSCTL_CHILDREN(oid);
327838035ed6SNavdeep Parhar 
327938035ed6SNavdeep Parhar 	oid = SYSCTL_ADD_NODE(ctx, children, OID_AUTO, "fl", CTLFLAG_RD, NULL,
328038035ed6SNavdeep Parhar 	    "freelist");
328138035ed6SNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
328238035ed6SNavdeep Parhar 
3283aa93b99aSNavdeep Parhar 	SYSCTL_ADD_UAUTO(ctx, children, OID_AUTO, "ba", CTLFLAG_RD,
3284aa93b99aSNavdeep Parhar 	    &fl->ba, "bus address of descriptor ring");
3285aa93b99aSNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "dmalen", CTLFLAG_RD, NULL,
3286aa93b99aSNavdeep Parhar 	    fl->sidx * EQ_ESIZE + sc->params.sge.spg_len,
3287aa93b99aSNavdeep Parhar 	    "desc ring size in bytes");
328838035ed6SNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "cntxt_id",
328938035ed6SNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &fl->cntxt_id, 0, sysctl_uint16, "I",
329038035ed6SNavdeep Parhar 	    "SGE context id of the freelist");
3291e3207e19SNavdeep Parhar 	SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "padding", CTLFLAG_RD, NULL,
3292e3207e19SNavdeep Parhar 	    fl_pad ? 1 : 0, "padding enabled");
3293e3207e19SNavdeep Parhar 	SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "packing", CTLFLAG_RD, NULL,
3294e3207e19SNavdeep Parhar 	    fl->flags & FL_BUF_PACKING ? 1 : 0, "packing enabled");
329538035ed6SNavdeep Parhar 	SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "cidx", CTLFLAG_RD, &fl->cidx,
329638035ed6SNavdeep Parhar 	    0, "consumer index");
329738035ed6SNavdeep Parhar 	if (fl->flags & FL_BUF_PACKING) {
329838035ed6SNavdeep Parhar 		SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "rx_offset",
329938035ed6SNavdeep Parhar 		    CTLFLAG_RD, &fl->rx_offset, 0, "packing rx offset");
330038035ed6SNavdeep Parhar 	}
330138035ed6SNavdeep Parhar 	SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "pidx", CTLFLAG_RD, &fl->pidx,
330238035ed6SNavdeep Parhar 	    0, "producer index");
330338035ed6SNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "mbuf_allocated",
330438035ed6SNavdeep Parhar 	    CTLFLAG_RD, &fl->mbuf_allocated, "# of mbuf allocated");
330538035ed6SNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "mbuf_inlined",
330638035ed6SNavdeep Parhar 	    CTLFLAG_RD, &fl->mbuf_inlined, "# of mbuf inlined in clusters");
330738035ed6SNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "cluster_allocated",
330838035ed6SNavdeep Parhar 	    CTLFLAG_RD, &fl->cl_allocated, "# of clusters allocated");
330938035ed6SNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "cluster_recycled",
331038035ed6SNavdeep Parhar 	    CTLFLAG_RD, &fl->cl_recycled, "# of clusters recycled");
331138035ed6SNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "cluster_fast_recycled",
331238035ed6SNavdeep Parhar 	    CTLFLAG_RD, &fl->cl_fast_recycled, "# of clusters recycled (fast)");
331338035ed6SNavdeep Parhar }
331438035ed6SNavdeep Parhar 
331554e4ee71SNavdeep Parhar static int
3316733b9277SNavdeep Parhar alloc_fwq(struct adapter *sc)
331754e4ee71SNavdeep Parhar {
3318733b9277SNavdeep Parhar 	int rc, intr_idx;
331956599263SNavdeep Parhar 	struct sge_iq *fwq = &sc->sge.fwq;
3320733b9277SNavdeep Parhar 	struct sysctl_oid *oid = device_get_sysctl_tree(sc->dev);
3321733b9277SNavdeep Parhar 	struct sysctl_oid_list *children = SYSCTL_CHILDREN(oid);
332256599263SNavdeep Parhar 
3323b2daa9a9SNavdeep Parhar 	init_iq(fwq, sc, 0, 0, FW_IQ_QSIZE);
33246af45170SJohn Baldwin 	if (sc->flags & IS_VF)
33256af45170SJohn Baldwin 		intr_idx = 0;
33264535e804SNavdeep Parhar 	else
3327733b9277SNavdeep Parhar 		intr_idx = sc->intr_count > 1 ? 1 : 0;
3328fe2ebb76SJohn Baldwin 	rc = alloc_iq_fl(&sc->port[0]->vi[0], fwq, NULL, intr_idx, -1);
3329733b9277SNavdeep Parhar 	if (rc != 0) {
3330733b9277SNavdeep Parhar 		device_printf(sc->dev,
3331733b9277SNavdeep Parhar 		    "failed to create firmware event queue: %d\n", rc);
333256599263SNavdeep Parhar 		return (rc);
3333733b9277SNavdeep Parhar 	}
333456599263SNavdeep Parhar 
3335733b9277SNavdeep Parhar 	oid = SYSCTL_ADD_NODE(&sc->ctx, children, OID_AUTO, "fwq", CTLFLAG_RD,
3336733b9277SNavdeep Parhar 	    NULL, "firmware event queue");
3337348694daSNavdeep Parhar 	add_iq_sysctls(&sc->ctx, oid, fwq);
333856599263SNavdeep Parhar 
3339733b9277SNavdeep Parhar 	return (0);
3340733b9277SNavdeep Parhar }
3341733b9277SNavdeep Parhar 
3342733b9277SNavdeep Parhar static int
3343733b9277SNavdeep Parhar free_fwq(struct adapter *sc)
3344733b9277SNavdeep Parhar {
3345733b9277SNavdeep Parhar 	return free_iq_fl(NULL, &sc->sge.fwq, NULL);
3346733b9277SNavdeep Parhar }
3347733b9277SNavdeep Parhar 
3348733b9277SNavdeep Parhar static int
334937310a98SNavdeep Parhar alloc_ctrlq(struct adapter *sc, struct sge_wrq *ctrlq, int idx,
335037310a98SNavdeep Parhar     struct sysctl_oid *oid)
3351733b9277SNavdeep Parhar {
3352733b9277SNavdeep Parhar 	int rc;
3353733b9277SNavdeep Parhar 	char name[16];
335437310a98SNavdeep Parhar 	struct sysctl_oid_list *children;
3355733b9277SNavdeep Parhar 
335637310a98SNavdeep Parhar 	snprintf(name, sizeof(name), "%s ctrlq%d", device_get_nameunit(sc->dev),
335737310a98SNavdeep Parhar 	    idx);
335837310a98SNavdeep Parhar 	init_eq(sc, &ctrlq->eq, EQ_CTRL, CTRL_EQ_QSIZE, sc->port[idx]->tx_chan,
3359733b9277SNavdeep Parhar 	    sc->sge.fwq.cntxt_id, name);
336037310a98SNavdeep Parhar 
336137310a98SNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
336237310a98SNavdeep Parhar 	snprintf(name, sizeof(name), "%d", idx);
336337310a98SNavdeep Parhar 	oid = SYSCTL_ADD_NODE(&sc->ctx, children, OID_AUTO, name, CTLFLAG_RD,
336437310a98SNavdeep Parhar 	    NULL, "ctrl queue");
336537310a98SNavdeep Parhar 	rc = alloc_wrq(sc, NULL, ctrlq, oid);
336637310a98SNavdeep Parhar 
336756599263SNavdeep Parhar 	return (rc);
336856599263SNavdeep Parhar }
336956599263SNavdeep Parhar 
33701605bac6SNavdeep Parhar int
33719af71ab3SNavdeep Parhar tnl_cong(struct port_info *pi, int drop)
33729fb8886bSNavdeep Parhar {
33739fb8886bSNavdeep Parhar 
33749af71ab3SNavdeep Parhar 	if (drop == -1)
33759fb8886bSNavdeep Parhar 		return (-1);
33769af71ab3SNavdeep Parhar 	else if (drop == 1)
33779fb8886bSNavdeep Parhar 		return (0);
33789fb8886bSNavdeep Parhar 	else
33795bcae8ddSNavdeep Parhar 		return (pi->rx_e_chan_map);
33809fb8886bSNavdeep Parhar }
33819fb8886bSNavdeep Parhar 
3382733b9277SNavdeep Parhar static int
3383fe2ebb76SJohn Baldwin alloc_rxq(struct vi_info *vi, struct sge_rxq *rxq, int intr_idx, int idx,
3384733b9277SNavdeep Parhar     struct sysctl_oid *oid)
338554e4ee71SNavdeep Parhar {
338654e4ee71SNavdeep Parhar 	int rc;
3387ec55567cSJohn Baldwin 	struct adapter *sc = vi->pi->adapter;
338854e4ee71SNavdeep Parhar 	struct sysctl_oid_list *children;
338954e4ee71SNavdeep Parhar 	char name[16];
339054e4ee71SNavdeep Parhar 
3391fe2ebb76SJohn Baldwin 	rc = alloc_iq_fl(vi, &rxq->iq, &rxq->fl, intr_idx,
3392fe2ebb76SJohn Baldwin 	    tnl_cong(vi->pi, cong_drop));
339354e4ee71SNavdeep Parhar 	if (rc != 0)
339454e4ee71SNavdeep Parhar 		return (rc);
339554e4ee71SNavdeep Parhar 
3396ec55567cSJohn Baldwin 	if (idx == 0)
3397ec55567cSJohn Baldwin 		sc->sge.iq_base = rxq->iq.abs_id - rxq->iq.cntxt_id;
3398ec55567cSJohn Baldwin 	else
3399ec55567cSJohn Baldwin 		KASSERT(rxq->iq.cntxt_id + sc->sge.iq_base == rxq->iq.abs_id,
3400ec55567cSJohn Baldwin 		    ("iq_base mismatch"));
3401ec55567cSJohn Baldwin 	KASSERT(sc->sge.iq_base == 0 || sc->flags & IS_VF,
3402ec55567cSJohn Baldwin 	    ("PF with non-zero iq_base"));
3403ec55567cSJohn Baldwin 
34044d6db4e0SNavdeep Parhar 	/*
34054d6db4e0SNavdeep Parhar 	 * The freelist is just barely above the starvation threshold right now,
34064d6db4e0SNavdeep Parhar 	 * fill it up a bit more.
34074d6db4e0SNavdeep Parhar 	 */
34089b4d7b4eSNavdeep Parhar 	FL_LOCK(&rxq->fl);
3409ec55567cSJohn Baldwin 	refill_fl(sc, &rxq->fl, 128);
34109b4d7b4eSNavdeep Parhar 	FL_UNLOCK(&rxq->fl);
34119b4d7b4eSNavdeep Parhar 
3412a1ea9a82SNavdeep Parhar #if defined(INET) || defined(INET6)
341346f48ee5SNavdeep Parhar 	rc = tcp_lro_init_args(&rxq->lro, vi->ifp, lro_entries, lro_mbufs);
341454e4ee71SNavdeep Parhar 	if (rc != 0)
341554e4ee71SNavdeep Parhar 		return (rc);
341646f48ee5SNavdeep Parhar 	MPASS(rxq->lro.ifp == vi->ifp);	/* also indicates LRO init'ed */
341754e4ee71SNavdeep Parhar 
3418fe2ebb76SJohn Baldwin 	if (vi->ifp->if_capenable & IFCAP_LRO)
3419733b9277SNavdeep Parhar 		rxq->iq.flags |= IQ_LRO_ENABLED;
342054e4ee71SNavdeep Parhar #endif
3421fe2ebb76SJohn Baldwin 	rxq->ifp = vi->ifp;
342254e4ee71SNavdeep Parhar 
3423733b9277SNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
342454e4ee71SNavdeep Parhar 
342554e4ee71SNavdeep Parhar 	snprintf(name, sizeof(name), "%d", idx);
3426fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, name, CTLFLAG_RD,
342754e4ee71SNavdeep Parhar 	    NULL, "rx queue");
342854e4ee71SNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
342954e4ee71SNavdeep Parhar 
3430348694daSNavdeep Parhar 	add_iq_sysctls(&vi->ctx, oid, &rxq->iq);
3431a1ea9a82SNavdeep Parhar #if defined(INET) || defined(INET6)
3432e936121dSHans Petter Selasky 	SYSCTL_ADD_U64(&vi->ctx, children, OID_AUTO, "lro_queued", CTLFLAG_RD,
343354e4ee71SNavdeep Parhar 	    &rxq->lro.lro_queued, 0, NULL);
3434e936121dSHans Petter Selasky 	SYSCTL_ADD_U64(&vi->ctx, children, OID_AUTO, "lro_flushed", CTLFLAG_RD,
343554e4ee71SNavdeep Parhar 	    &rxq->lro.lro_flushed, 0, NULL);
34367d29df59SNavdeep Parhar #endif
3437fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "rxcsum", CTLFLAG_RD,
343854e4ee71SNavdeep Parhar 	    &rxq->rxcsum, "# of times hardware assisted with checksum");
3439fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "vlan_extraction",
344054e4ee71SNavdeep Parhar 	    CTLFLAG_RD, &rxq->vlan_extraction,
344154e4ee71SNavdeep Parhar 	    "# of times hardware extracted 802.1Q tag");
344254e4ee71SNavdeep Parhar 
3443aa93b99aSNavdeep Parhar 	add_fl_sysctls(sc, &vi->ctx, oid, &rxq->fl);
344459bc8ce0SNavdeep Parhar 
344554e4ee71SNavdeep Parhar 	return (rc);
344654e4ee71SNavdeep Parhar }
344754e4ee71SNavdeep Parhar 
344854e4ee71SNavdeep Parhar static int
3449fe2ebb76SJohn Baldwin free_rxq(struct vi_info *vi, struct sge_rxq *rxq)
345054e4ee71SNavdeep Parhar {
345154e4ee71SNavdeep Parhar 	int rc;
345254e4ee71SNavdeep Parhar 
3453a1ea9a82SNavdeep Parhar #if defined(INET) || defined(INET6)
345454e4ee71SNavdeep Parhar 	if (rxq->lro.ifp) {
345554e4ee71SNavdeep Parhar 		tcp_lro_free(&rxq->lro);
345654e4ee71SNavdeep Parhar 		rxq->lro.ifp = NULL;
345754e4ee71SNavdeep Parhar 	}
345854e4ee71SNavdeep Parhar #endif
345954e4ee71SNavdeep Parhar 
3460fe2ebb76SJohn Baldwin 	rc = free_iq_fl(vi, &rxq->iq, &rxq->fl);
346154e4ee71SNavdeep Parhar 	if (rc == 0)
346254e4ee71SNavdeep Parhar 		bzero(rxq, sizeof(*rxq));
346354e4ee71SNavdeep Parhar 
346454e4ee71SNavdeep Parhar 	return (rc);
346554e4ee71SNavdeep Parhar }
346654e4ee71SNavdeep Parhar 
346709fe6320SNavdeep Parhar #ifdef TCP_OFFLOAD
346854e4ee71SNavdeep Parhar static int
3469fe2ebb76SJohn Baldwin alloc_ofld_rxq(struct vi_info *vi, struct sge_ofld_rxq *ofld_rxq,
3470733b9277SNavdeep Parhar     int intr_idx, int idx, struct sysctl_oid *oid)
3471f7dfe243SNavdeep Parhar {
3472aa93b99aSNavdeep Parhar 	struct port_info *pi = vi->pi;
3473733b9277SNavdeep Parhar 	int rc;
3474f7dfe243SNavdeep Parhar 	struct sysctl_oid_list *children;
3475733b9277SNavdeep Parhar 	char name[16];
3476f7dfe243SNavdeep Parhar 
34775bcae8ddSNavdeep Parhar 	rc = alloc_iq_fl(vi, &ofld_rxq->iq, &ofld_rxq->fl, intr_idx, 0);
3478733b9277SNavdeep Parhar 	if (rc != 0)
3479f7dfe243SNavdeep Parhar 		return (rc);
3480f7dfe243SNavdeep Parhar 
3481733b9277SNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
3482733b9277SNavdeep Parhar 
3483733b9277SNavdeep Parhar 	snprintf(name, sizeof(name), "%d", idx);
3484fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, name, CTLFLAG_RD,
3485733b9277SNavdeep Parhar 	    NULL, "rx queue");
3486348694daSNavdeep Parhar 	add_iq_sysctls(&vi->ctx, oid, &ofld_rxq->iq);
3487aa93b99aSNavdeep Parhar 	add_fl_sysctls(pi->adapter, &vi->ctx, oid, &ofld_rxq->fl);
3488733b9277SNavdeep Parhar 
3489733b9277SNavdeep Parhar 	return (rc);
3490733b9277SNavdeep Parhar }
3491733b9277SNavdeep Parhar 
3492733b9277SNavdeep Parhar static int
3493fe2ebb76SJohn Baldwin free_ofld_rxq(struct vi_info *vi, struct sge_ofld_rxq *ofld_rxq)
3494733b9277SNavdeep Parhar {
3495733b9277SNavdeep Parhar 	int rc;
3496733b9277SNavdeep Parhar 
3497fe2ebb76SJohn Baldwin 	rc = free_iq_fl(vi, &ofld_rxq->iq, &ofld_rxq->fl);
3498733b9277SNavdeep Parhar 	if (rc == 0)
3499733b9277SNavdeep Parhar 		bzero(ofld_rxq, sizeof(*ofld_rxq));
3500733b9277SNavdeep Parhar 
3501733b9277SNavdeep Parhar 	return (rc);
3502733b9277SNavdeep Parhar }
3503733b9277SNavdeep Parhar #endif
3504733b9277SNavdeep Parhar 
3505298d969cSNavdeep Parhar #ifdef DEV_NETMAP
3506298d969cSNavdeep Parhar static int
3507fe2ebb76SJohn Baldwin alloc_nm_rxq(struct vi_info *vi, struct sge_nm_rxq *nm_rxq, int intr_idx,
3508298d969cSNavdeep Parhar     int idx, struct sysctl_oid *oid)
3509298d969cSNavdeep Parhar {
3510298d969cSNavdeep Parhar 	int rc;
3511298d969cSNavdeep Parhar 	struct sysctl_oid_list *children;
3512298d969cSNavdeep Parhar 	struct sysctl_ctx_list *ctx;
3513298d969cSNavdeep Parhar 	char name[16];
3514298d969cSNavdeep Parhar 	size_t len;
3515fe2ebb76SJohn Baldwin 	struct adapter *sc = vi->pi->adapter;
3516fe2ebb76SJohn Baldwin 	struct netmap_adapter *na = NA(vi->ifp);
3517298d969cSNavdeep Parhar 
3518298d969cSNavdeep Parhar 	MPASS(na != NULL);
3519298d969cSNavdeep Parhar 
3520fe2ebb76SJohn Baldwin 	len = vi->qsize_rxq * IQ_ESIZE;
3521298d969cSNavdeep Parhar 	rc = alloc_ring(sc, len, &nm_rxq->iq_desc_tag, &nm_rxq->iq_desc_map,
3522298d969cSNavdeep Parhar 	    &nm_rxq->iq_ba, (void **)&nm_rxq->iq_desc);
3523298d969cSNavdeep Parhar 	if (rc != 0)
3524298d969cSNavdeep Parhar 		return (rc);
3525298d969cSNavdeep Parhar 
352690e7434aSNavdeep Parhar 	len = na->num_rx_desc * EQ_ESIZE + sc->params.sge.spg_len;
3527298d969cSNavdeep Parhar 	rc = alloc_ring(sc, len, &nm_rxq->fl_desc_tag, &nm_rxq->fl_desc_map,
3528298d969cSNavdeep Parhar 	    &nm_rxq->fl_ba, (void **)&nm_rxq->fl_desc);
3529298d969cSNavdeep Parhar 	if (rc != 0)
3530298d969cSNavdeep Parhar 		return (rc);
3531298d969cSNavdeep Parhar 
3532fe2ebb76SJohn Baldwin 	nm_rxq->vi = vi;
3533298d969cSNavdeep Parhar 	nm_rxq->nid = idx;
3534298d969cSNavdeep Parhar 	nm_rxq->iq_cidx = 0;
353590e7434aSNavdeep Parhar 	nm_rxq->iq_sidx = vi->qsize_rxq - sc->params.sge.spg_len / IQ_ESIZE;
3536298d969cSNavdeep Parhar 	nm_rxq->iq_gen = F_RSPD_GEN;
3537298d969cSNavdeep Parhar 	nm_rxq->fl_pidx = nm_rxq->fl_cidx = 0;
3538298d969cSNavdeep Parhar 	nm_rxq->fl_sidx = na->num_rx_desc;
3539298d969cSNavdeep Parhar 	nm_rxq->intr_idx = intr_idx;
3540a8c4fcb9SNavdeep Parhar 	nm_rxq->iq_cntxt_id = INVALID_NM_RXQ_CNTXT_ID;
3541298d969cSNavdeep Parhar 
3542fe2ebb76SJohn Baldwin 	ctx = &vi->ctx;
3543298d969cSNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
3544298d969cSNavdeep Parhar 
3545298d969cSNavdeep Parhar 	snprintf(name, sizeof(name), "%d", idx);
3546298d969cSNavdeep Parhar 	oid = SYSCTL_ADD_NODE(ctx, children, OID_AUTO, name, CTLFLAG_RD, NULL,
3547298d969cSNavdeep Parhar 	    "rx queue");
3548298d969cSNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
3549298d969cSNavdeep Parhar 
3550298d969cSNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "abs_id",
3551298d969cSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &nm_rxq->iq_abs_id, 0, sysctl_uint16,
3552298d969cSNavdeep Parhar 	    "I", "absolute id of the queue");
3553298d969cSNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "cntxt_id",
3554298d969cSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &nm_rxq->iq_cntxt_id, 0, sysctl_uint16,
3555298d969cSNavdeep Parhar 	    "I", "SGE context id of the queue");
3556298d969cSNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "cidx",
3557298d969cSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &nm_rxq->iq_cidx, 0, sysctl_uint16, "I",
3558298d969cSNavdeep Parhar 	    "consumer index");
3559298d969cSNavdeep Parhar 
3560298d969cSNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
3561298d969cSNavdeep Parhar 	oid = SYSCTL_ADD_NODE(ctx, children, OID_AUTO, "fl", CTLFLAG_RD, NULL,
3562298d969cSNavdeep Parhar 	    "freelist");
3563298d969cSNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
3564298d969cSNavdeep Parhar 
3565298d969cSNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "cntxt_id",
3566298d969cSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &nm_rxq->fl_cntxt_id, 0, sysctl_uint16,
3567298d969cSNavdeep Parhar 	    "I", "SGE context id of the freelist");
3568298d969cSNavdeep Parhar 	SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "cidx", CTLFLAG_RD,
3569298d969cSNavdeep Parhar 	    &nm_rxq->fl_cidx, 0, "consumer index");
3570298d969cSNavdeep Parhar 	SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "pidx", CTLFLAG_RD,
3571298d969cSNavdeep Parhar 	    &nm_rxq->fl_pidx, 0, "producer index");
3572298d969cSNavdeep Parhar 
3573298d969cSNavdeep Parhar 	return (rc);
3574298d969cSNavdeep Parhar }
3575298d969cSNavdeep Parhar 
3576298d969cSNavdeep Parhar 
3577298d969cSNavdeep Parhar static int
3578fe2ebb76SJohn Baldwin free_nm_rxq(struct vi_info *vi, struct sge_nm_rxq *nm_rxq)
3579298d969cSNavdeep Parhar {
3580fe2ebb76SJohn Baldwin 	struct adapter *sc = vi->pi->adapter;
3581298d969cSNavdeep Parhar 
35820fa7560dSNavdeep Parhar 	if (vi->flags & VI_INIT_DONE)
3583a8c4fcb9SNavdeep Parhar 		MPASS(nm_rxq->iq_cntxt_id == INVALID_NM_RXQ_CNTXT_ID);
35840fa7560dSNavdeep Parhar 	else
35850fa7560dSNavdeep Parhar 		MPASS(nm_rxq->iq_cntxt_id == 0);
3586a8c4fcb9SNavdeep Parhar 
3587298d969cSNavdeep Parhar 	free_ring(sc, nm_rxq->iq_desc_tag, nm_rxq->iq_desc_map, nm_rxq->iq_ba,
3588298d969cSNavdeep Parhar 	    nm_rxq->iq_desc);
3589298d969cSNavdeep Parhar 	free_ring(sc, nm_rxq->fl_desc_tag, nm_rxq->fl_desc_map, nm_rxq->fl_ba,
3590298d969cSNavdeep Parhar 	    nm_rxq->fl_desc);
3591298d969cSNavdeep Parhar 
3592298d969cSNavdeep Parhar 	return (0);
3593298d969cSNavdeep Parhar }
3594298d969cSNavdeep Parhar 
3595298d969cSNavdeep Parhar static int
3596fe2ebb76SJohn Baldwin alloc_nm_txq(struct vi_info *vi, struct sge_nm_txq *nm_txq, int iqidx, int idx,
3597298d969cSNavdeep Parhar     struct sysctl_oid *oid)
3598298d969cSNavdeep Parhar {
3599298d969cSNavdeep Parhar 	int rc;
3600298d969cSNavdeep Parhar 	size_t len;
3601fe2ebb76SJohn Baldwin 	struct port_info *pi = vi->pi;
3602298d969cSNavdeep Parhar 	struct adapter *sc = pi->adapter;
3603fe2ebb76SJohn Baldwin 	struct netmap_adapter *na = NA(vi->ifp);
3604298d969cSNavdeep Parhar 	char name[16];
3605298d969cSNavdeep Parhar 	struct sysctl_oid_list *children = SYSCTL_CHILDREN(oid);
3606298d969cSNavdeep Parhar 
360790e7434aSNavdeep Parhar 	len = na->num_tx_desc * EQ_ESIZE + sc->params.sge.spg_len;
3608298d969cSNavdeep Parhar 	rc = alloc_ring(sc, len, &nm_txq->desc_tag, &nm_txq->desc_map,
3609298d969cSNavdeep Parhar 	    &nm_txq->ba, (void **)&nm_txq->desc);
3610298d969cSNavdeep Parhar 	if (rc)
3611298d969cSNavdeep Parhar 		return (rc);
3612298d969cSNavdeep Parhar 
3613298d969cSNavdeep Parhar 	nm_txq->pidx = nm_txq->cidx = 0;
3614298d969cSNavdeep Parhar 	nm_txq->sidx = na->num_tx_desc;
3615298d969cSNavdeep Parhar 	nm_txq->nid = idx;
3616298d969cSNavdeep Parhar 	nm_txq->iqidx = iqidx;
3617298d969cSNavdeep Parhar 	nm_txq->cpl_ctrl0 = htobe32(V_TXPKT_OPCODE(CPL_TX_PKT) |
361897f2919dSNavdeep Parhar 	    V_TXPKT_INTF(pi->tx_chan) | V_TXPKT_PF(G_FW_VIID_PFN(vi->viid)) |
361997f2919dSNavdeep Parhar 	    V_TXPKT_VF(G_FW_VIID_VIN(vi->viid)) |
362097f2919dSNavdeep Parhar 	    V_TXPKT_VF_VLD(G_FW_VIID_VIVLD(vi->viid)));
3621a8c4fcb9SNavdeep Parhar 	nm_txq->cntxt_id = INVALID_NM_TXQ_CNTXT_ID;
3622298d969cSNavdeep Parhar 
3623298d969cSNavdeep Parhar 	snprintf(name, sizeof(name), "%d", idx);
3624fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, name, CTLFLAG_RD,
3625298d969cSNavdeep Parhar 	    NULL, "netmap tx queue");
3626298d969cSNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
3627298d969cSNavdeep Parhar 
3628fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UINT(&vi->ctx, children, OID_AUTO, "cntxt_id", CTLFLAG_RD,
3629298d969cSNavdeep Parhar 	    &nm_txq->cntxt_id, 0, "SGE context id of the queue");
3630fe2ebb76SJohn Baldwin 	SYSCTL_ADD_PROC(&vi->ctx, children, OID_AUTO, "cidx",
3631298d969cSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &nm_txq->cidx, 0, sysctl_uint16, "I",
3632298d969cSNavdeep Parhar 	    "consumer index");
3633fe2ebb76SJohn Baldwin 	SYSCTL_ADD_PROC(&vi->ctx, children, OID_AUTO, "pidx",
3634298d969cSNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &nm_txq->pidx, 0, sysctl_uint16, "I",
3635298d969cSNavdeep Parhar 	    "producer index");
3636298d969cSNavdeep Parhar 
3637298d969cSNavdeep Parhar 	return (rc);
3638298d969cSNavdeep Parhar }
3639298d969cSNavdeep Parhar 
3640298d969cSNavdeep Parhar static int
3641fe2ebb76SJohn Baldwin free_nm_txq(struct vi_info *vi, struct sge_nm_txq *nm_txq)
3642298d969cSNavdeep Parhar {
3643fe2ebb76SJohn Baldwin 	struct adapter *sc = vi->pi->adapter;
3644298d969cSNavdeep Parhar 
36450fa7560dSNavdeep Parhar 	if (vi->flags & VI_INIT_DONE)
3646a8c4fcb9SNavdeep Parhar 		MPASS(nm_txq->cntxt_id == INVALID_NM_TXQ_CNTXT_ID);
36470fa7560dSNavdeep Parhar 	else
36480fa7560dSNavdeep Parhar 		MPASS(nm_txq->cntxt_id == 0);
3649a8c4fcb9SNavdeep Parhar 
3650298d969cSNavdeep Parhar 	free_ring(sc, nm_txq->desc_tag, nm_txq->desc_map, nm_txq->ba,
3651298d969cSNavdeep Parhar 	    nm_txq->desc);
3652298d969cSNavdeep Parhar 
3653298d969cSNavdeep Parhar 	return (0);
3654298d969cSNavdeep Parhar }
3655298d969cSNavdeep Parhar #endif
3656298d969cSNavdeep Parhar 
3657ddf09ad6SNavdeep Parhar /*
3658ddf09ad6SNavdeep Parhar  * Returns a reasonable automatic cidx flush threshold for a given queue size.
3659ddf09ad6SNavdeep Parhar  */
3660ddf09ad6SNavdeep Parhar static u_int
3661ddf09ad6SNavdeep Parhar qsize_to_fthresh(int qsize)
3662ddf09ad6SNavdeep Parhar {
3663ddf09ad6SNavdeep Parhar 	u_int fthresh;
3664ddf09ad6SNavdeep Parhar 
3665ddf09ad6SNavdeep Parhar 	while (!powerof2(qsize))
3666ddf09ad6SNavdeep Parhar 		qsize++;
3667ddf09ad6SNavdeep Parhar 	fthresh = ilog2(qsize);
3668ddf09ad6SNavdeep Parhar 	if (fthresh > X_CIDXFLUSHTHRESH_128)
3669ddf09ad6SNavdeep Parhar 		fthresh = X_CIDXFLUSHTHRESH_128;
3670ddf09ad6SNavdeep Parhar 
3671ddf09ad6SNavdeep Parhar 	return (fthresh);
3672ddf09ad6SNavdeep Parhar }
3673ddf09ad6SNavdeep Parhar 
3674733b9277SNavdeep Parhar static int
3675733b9277SNavdeep Parhar ctrl_eq_alloc(struct adapter *sc, struct sge_eq *eq)
3676733b9277SNavdeep Parhar {
3677733b9277SNavdeep Parhar 	int rc, cntxt_id;
3678733b9277SNavdeep Parhar 	struct fw_eq_ctrl_cmd c;
367990e7434aSNavdeep Parhar 	int qsize = eq->sidx + sc->params.sge.spg_len / EQ_ESIZE;
3680f7dfe243SNavdeep Parhar 
3681f7dfe243SNavdeep Parhar 	bzero(&c, sizeof(c));
3682f7dfe243SNavdeep Parhar 
3683f7dfe243SNavdeep Parhar 	c.op_to_vfn = htobe32(V_FW_CMD_OP(FW_EQ_CTRL_CMD) | F_FW_CMD_REQUEST |
3684f7dfe243SNavdeep Parhar 	    F_FW_CMD_WRITE | F_FW_CMD_EXEC | V_FW_EQ_CTRL_CMD_PFN(sc->pf) |
3685f7dfe243SNavdeep Parhar 	    V_FW_EQ_CTRL_CMD_VFN(0));
3686f7dfe243SNavdeep Parhar 	c.alloc_to_len16 = htobe32(F_FW_EQ_CTRL_CMD_ALLOC |
3687f7dfe243SNavdeep Parhar 	    F_FW_EQ_CTRL_CMD_EQSTART | FW_LEN16(c));
36887951040fSNavdeep Parhar 	c.cmpliqid_eqid = htonl(V_FW_EQ_CTRL_CMD_CMPLIQID(eq->iqid));
3689f7dfe243SNavdeep Parhar 	c.physeqid_pkd = htobe32(0);
3690f7dfe243SNavdeep Parhar 	c.fetchszm_to_iqid =
369187b027baSNavdeep Parhar 	    htobe32(V_FW_EQ_CTRL_CMD_HOSTFCMODE(X_HOSTFCMODE_STATUS_PAGE) |
3692733b9277SNavdeep Parhar 		V_FW_EQ_CTRL_CMD_PCIECHN(eq->tx_chan) |
369356599263SNavdeep Parhar 		F_FW_EQ_CTRL_CMD_FETCHRO | V_FW_EQ_CTRL_CMD_IQID(eq->iqid));
3694f7dfe243SNavdeep Parhar 	c.dcaen_to_eqsize =
3695f7dfe243SNavdeep Parhar 	    htobe32(V_FW_EQ_CTRL_CMD_FBMIN(X_FETCHBURSTMIN_64B) |
3696f7dfe243SNavdeep Parhar 		V_FW_EQ_CTRL_CMD_FBMAX(X_FETCHBURSTMAX_512B) |
3697ddf09ad6SNavdeep Parhar 		V_FW_EQ_CTRL_CMD_CIDXFTHRESH(qsize_to_fthresh(qsize)) |
36987951040fSNavdeep Parhar 		V_FW_EQ_CTRL_CMD_EQSIZE(qsize));
3699f7dfe243SNavdeep Parhar 	c.eqaddr = htobe64(eq->ba);
3700f7dfe243SNavdeep Parhar 
3701f7dfe243SNavdeep Parhar 	rc = -t4_wr_mbox(sc, sc->mbox, &c, sizeof(c), &c);
3702f7dfe243SNavdeep Parhar 	if (rc != 0) {
3703f7dfe243SNavdeep Parhar 		device_printf(sc->dev,
3704733b9277SNavdeep Parhar 		    "failed to create control queue %d: %d\n", eq->tx_chan, rc);
3705f7dfe243SNavdeep Parhar 		return (rc);
3706f7dfe243SNavdeep Parhar 	}
3707733b9277SNavdeep Parhar 	eq->flags |= EQ_ALLOCATED;
3708f7dfe243SNavdeep Parhar 
3709f7dfe243SNavdeep Parhar 	eq->cntxt_id = G_FW_EQ_CTRL_CMD_EQID(be32toh(c.cmpliqid_eqid));
3710f7dfe243SNavdeep Parhar 	cntxt_id = eq->cntxt_id - sc->sge.eq_start;
3711733b9277SNavdeep Parhar 	if (cntxt_id >= sc->sge.neq)
3712733b9277SNavdeep Parhar 	    panic("%s: eq->cntxt_id (%d) more than the max (%d)", __func__,
3713733b9277SNavdeep Parhar 		cntxt_id, sc->sge.neq - 1);
3714f7dfe243SNavdeep Parhar 	sc->sge.eqmap[cntxt_id] = eq;
3715f7dfe243SNavdeep Parhar 
3716f7dfe243SNavdeep Parhar 	return (rc);
3717f7dfe243SNavdeep Parhar }
3718f7dfe243SNavdeep Parhar 
3719f7dfe243SNavdeep Parhar static int
3720fe2ebb76SJohn Baldwin eth_eq_alloc(struct adapter *sc, struct vi_info *vi, struct sge_eq *eq)
372154e4ee71SNavdeep Parhar {
372254e4ee71SNavdeep Parhar 	int rc, cntxt_id;
372354e4ee71SNavdeep Parhar 	struct fw_eq_eth_cmd c;
372490e7434aSNavdeep Parhar 	int qsize = eq->sidx + sc->params.sge.spg_len / EQ_ESIZE;
372554e4ee71SNavdeep Parhar 
372654e4ee71SNavdeep Parhar 	bzero(&c, sizeof(c));
372754e4ee71SNavdeep Parhar 
372854e4ee71SNavdeep Parhar 	c.op_to_vfn = htobe32(V_FW_CMD_OP(FW_EQ_ETH_CMD) | F_FW_CMD_REQUEST |
372954e4ee71SNavdeep Parhar 	    F_FW_CMD_WRITE | F_FW_CMD_EXEC | V_FW_EQ_ETH_CMD_PFN(sc->pf) |
373054e4ee71SNavdeep Parhar 	    V_FW_EQ_ETH_CMD_VFN(0));
373154e4ee71SNavdeep Parhar 	c.alloc_to_len16 = htobe32(F_FW_EQ_ETH_CMD_ALLOC |
373254e4ee71SNavdeep Parhar 	    F_FW_EQ_ETH_CMD_EQSTART | FW_LEN16(c));
37337951040fSNavdeep Parhar 	c.autoequiqe_to_viid = htobe32(F_FW_EQ_ETH_CMD_AUTOEQUIQE |
3734fe2ebb76SJohn Baldwin 	    F_FW_EQ_ETH_CMD_AUTOEQUEQE | V_FW_EQ_ETH_CMD_VIID(vi->viid));
373554e4ee71SNavdeep Parhar 	c.fetchszm_to_iqid =
37367951040fSNavdeep Parhar 	    htobe32(V_FW_EQ_ETH_CMD_HOSTFCMODE(X_HOSTFCMODE_NONE) |
3737733b9277SNavdeep Parhar 		V_FW_EQ_ETH_CMD_PCIECHN(eq->tx_chan) | F_FW_EQ_ETH_CMD_FETCHRO |
3738aa2457e1SNavdeep Parhar 		V_FW_EQ_ETH_CMD_IQID(eq->iqid));
373954e4ee71SNavdeep Parhar 	c.dcaen_to_eqsize = htobe32(V_FW_EQ_ETH_CMD_FBMIN(X_FETCHBURSTMIN_64B) |
374054e4ee71SNavdeep Parhar 	    V_FW_EQ_ETH_CMD_FBMAX(X_FETCHBURSTMAX_512B) |
37417951040fSNavdeep Parhar 	    V_FW_EQ_ETH_CMD_EQSIZE(qsize));
374254e4ee71SNavdeep Parhar 	c.eqaddr = htobe64(eq->ba);
374354e4ee71SNavdeep Parhar 
374454e4ee71SNavdeep Parhar 	rc = -t4_wr_mbox(sc, sc->mbox, &c, sizeof(c), &c);
374554e4ee71SNavdeep Parhar 	if (rc != 0) {
3746fe2ebb76SJohn Baldwin 		device_printf(vi->dev,
3747733b9277SNavdeep Parhar 		    "failed to create Ethernet egress queue: %d\n", rc);
3748733b9277SNavdeep Parhar 		return (rc);
3749733b9277SNavdeep Parhar 	}
3750733b9277SNavdeep Parhar 	eq->flags |= EQ_ALLOCATED;
3751733b9277SNavdeep Parhar 
3752733b9277SNavdeep Parhar 	eq->cntxt_id = G_FW_EQ_ETH_CMD_EQID(be32toh(c.eqid_pkd));
3753ec55567cSJohn Baldwin 	eq->abs_id = G_FW_EQ_ETH_CMD_PHYSEQID(be32toh(c.physeqid_pkd));
3754733b9277SNavdeep Parhar 	cntxt_id = eq->cntxt_id - sc->sge.eq_start;
3755733b9277SNavdeep Parhar 	if (cntxt_id >= sc->sge.neq)
3756733b9277SNavdeep Parhar 	    panic("%s: eq->cntxt_id (%d) more than the max (%d)", __func__,
3757733b9277SNavdeep Parhar 		cntxt_id, sc->sge.neq - 1);
3758733b9277SNavdeep Parhar 	sc->sge.eqmap[cntxt_id] = eq;
3759733b9277SNavdeep Parhar 
376054e4ee71SNavdeep Parhar 	return (rc);
376154e4ee71SNavdeep Parhar }
376254e4ee71SNavdeep Parhar 
3763eff62dbaSNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
3764733b9277SNavdeep Parhar static int
3765fe2ebb76SJohn Baldwin ofld_eq_alloc(struct adapter *sc, struct vi_info *vi, struct sge_eq *eq)
3766733b9277SNavdeep Parhar {
3767733b9277SNavdeep Parhar 	int rc, cntxt_id;
3768733b9277SNavdeep Parhar 	struct fw_eq_ofld_cmd c;
376990e7434aSNavdeep Parhar 	int qsize = eq->sidx + sc->params.sge.spg_len / EQ_ESIZE;
377054e4ee71SNavdeep Parhar 
3771733b9277SNavdeep Parhar 	bzero(&c, sizeof(c));
3772733b9277SNavdeep Parhar 
3773733b9277SNavdeep Parhar 	c.op_to_vfn = htonl(V_FW_CMD_OP(FW_EQ_OFLD_CMD) | F_FW_CMD_REQUEST |
3774733b9277SNavdeep Parhar 	    F_FW_CMD_WRITE | F_FW_CMD_EXEC | V_FW_EQ_OFLD_CMD_PFN(sc->pf) |
3775733b9277SNavdeep Parhar 	    V_FW_EQ_OFLD_CMD_VFN(0));
3776733b9277SNavdeep Parhar 	c.alloc_to_len16 = htonl(F_FW_EQ_OFLD_CMD_ALLOC |
3777733b9277SNavdeep Parhar 	    F_FW_EQ_OFLD_CMD_EQSTART | FW_LEN16(c));
3778733b9277SNavdeep Parhar 	c.fetchszm_to_iqid =
3779ddf09ad6SNavdeep Parhar 		htonl(V_FW_EQ_OFLD_CMD_HOSTFCMODE(X_HOSTFCMODE_STATUS_PAGE) |
3780733b9277SNavdeep Parhar 		    V_FW_EQ_OFLD_CMD_PCIECHN(eq->tx_chan) |
3781733b9277SNavdeep Parhar 		    F_FW_EQ_OFLD_CMD_FETCHRO | V_FW_EQ_OFLD_CMD_IQID(eq->iqid));
3782733b9277SNavdeep Parhar 	c.dcaen_to_eqsize =
3783733b9277SNavdeep Parhar 	    htobe32(V_FW_EQ_OFLD_CMD_FBMIN(X_FETCHBURSTMIN_64B) |
3784733b9277SNavdeep Parhar 		V_FW_EQ_OFLD_CMD_FBMAX(X_FETCHBURSTMAX_512B) |
3785ddf09ad6SNavdeep Parhar 		V_FW_EQ_OFLD_CMD_CIDXFTHRESH(qsize_to_fthresh(qsize)) |
37867951040fSNavdeep Parhar 		V_FW_EQ_OFLD_CMD_EQSIZE(qsize));
3787733b9277SNavdeep Parhar 	c.eqaddr = htobe64(eq->ba);
3788733b9277SNavdeep Parhar 
3789733b9277SNavdeep Parhar 	rc = -t4_wr_mbox(sc, sc->mbox, &c, sizeof(c), &c);
3790733b9277SNavdeep Parhar 	if (rc != 0) {
3791fe2ebb76SJohn Baldwin 		device_printf(vi->dev,
3792733b9277SNavdeep Parhar 		    "failed to create egress queue for TCP offload: %d\n", rc);
3793733b9277SNavdeep Parhar 		return (rc);
3794733b9277SNavdeep Parhar 	}
3795733b9277SNavdeep Parhar 	eq->flags |= EQ_ALLOCATED;
3796733b9277SNavdeep Parhar 
3797733b9277SNavdeep Parhar 	eq->cntxt_id = G_FW_EQ_OFLD_CMD_EQID(be32toh(c.eqid_pkd));
379854e4ee71SNavdeep Parhar 	cntxt_id = eq->cntxt_id - sc->sge.eq_start;
3799733b9277SNavdeep Parhar 	if (cntxt_id >= sc->sge.neq)
3800733b9277SNavdeep Parhar 	    panic("%s: eq->cntxt_id (%d) more than the max (%d)", __func__,
3801733b9277SNavdeep Parhar 		cntxt_id, sc->sge.neq - 1);
380254e4ee71SNavdeep Parhar 	sc->sge.eqmap[cntxt_id] = eq;
380354e4ee71SNavdeep Parhar 
3804733b9277SNavdeep Parhar 	return (rc);
3805733b9277SNavdeep Parhar }
3806733b9277SNavdeep Parhar #endif
3807733b9277SNavdeep Parhar 
3808733b9277SNavdeep Parhar static int
3809fe2ebb76SJohn Baldwin alloc_eq(struct adapter *sc, struct vi_info *vi, struct sge_eq *eq)
3810733b9277SNavdeep Parhar {
38117951040fSNavdeep Parhar 	int rc, qsize;
3812733b9277SNavdeep Parhar 	size_t len;
3813733b9277SNavdeep Parhar 
3814733b9277SNavdeep Parhar 	mtx_init(&eq->eq_lock, eq->lockname, NULL, MTX_DEF);
3815733b9277SNavdeep Parhar 
381690e7434aSNavdeep Parhar 	qsize = eq->sidx + sc->params.sge.spg_len / EQ_ESIZE;
38177951040fSNavdeep Parhar 	len = qsize * EQ_ESIZE;
3818733b9277SNavdeep Parhar 	rc = alloc_ring(sc, len, &eq->desc_tag, &eq->desc_map,
3819733b9277SNavdeep Parhar 	    &eq->ba, (void **)&eq->desc);
3820733b9277SNavdeep Parhar 	if (rc)
3821733b9277SNavdeep Parhar 		return (rc);
3822733b9277SNavdeep Parhar 
3823ddf09ad6SNavdeep Parhar 	eq->pidx = eq->cidx = eq->dbidx = 0;
3824ddf09ad6SNavdeep Parhar 	/* Note that equeqidx is not used with sge_wrq (OFLD/CTRL) queues. */
3825ddf09ad6SNavdeep Parhar 	eq->equeqidx = 0;
3826d14b0ac1SNavdeep Parhar 	eq->doorbells = sc->doorbells;
3827733b9277SNavdeep Parhar 
3828733b9277SNavdeep Parhar 	switch (eq->flags & EQ_TYPEMASK) {
3829733b9277SNavdeep Parhar 	case EQ_CTRL:
3830733b9277SNavdeep Parhar 		rc = ctrl_eq_alloc(sc, eq);
3831733b9277SNavdeep Parhar 		break;
3832733b9277SNavdeep Parhar 
3833733b9277SNavdeep Parhar 	case EQ_ETH:
3834fe2ebb76SJohn Baldwin 		rc = eth_eq_alloc(sc, vi, eq);
3835733b9277SNavdeep Parhar 		break;
3836733b9277SNavdeep Parhar 
3837eff62dbaSNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
3838733b9277SNavdeep Parhar 	case EQ_OFLD:
3839fe2ebb76SJohn Baldwin 		rc = ofld_eq_alloc(sc, vi, eq);
3840733b9277SNavdeep Parhar 		break;
3841733b9277SNavdeep Parhar #endif
3842733b9277SNavdeep Parhar 
3843733b9277SNavdeep Parhar 	default:
3844733b9277SNavdeep Parhar 		panic("%s: invalid eq type %d.", __func__,
3845733b9277SNavdeep Parhar 		    eq->flags & EQ_TYPEMASK);
3846733b9277SNavdeep Parhar 	}
3847733b9277SNavdeep Parhar 	if (rc != 0) {
3848733b9277SNavdeep Parhar 		device_printf(sc->dev,
3849c086e3d1SNavdeep Parhar 		    "failed to allocate egress queue(%d): %d\n",
3850733b9277SNavdeep Parhar 		    eq->flags & EQ_TYPEMASK, rc);
3851733b9277SNavdeep Parhar 	}
3852733b9277SNavdeep Parhar 
3853d14b0ac1SNavdeep Parhar 	if (isset(&eq->doorbells, DOORBELL_UDB) ||
3854d14b0ac1SNavdeep Parhar 	    isset(&eq->doorbells, DOORBELL_UDBWC) ||
385577ad3c41SNavdeep Parhar 	    isset(&eq->doorbells, DOORBELL_WCWR)) {
385690e7434aSNavdeep Parhar 		uint32_t s_qpp = sc->params.sge.eq_s_qpp;
3857d14b0ac1SNavdeep Parhar 		uint32_t mask = (1 << s_qpp) - 1;
3858d14b0ac1SNavdeep Parhar 		volatile uint8_t *udb;
3859d14b0ac1SNavdeep Parhar 
3860d14b0ac1SNavdeep Parhar 		udb = sc->udbs_base + UDBS_DB_OFFSET;
3861d14b0ac1SNavdeep Parhar 		udb += (eq->cntxt_id >> s_qpp) << PAGE_SHIFT;	/* pg offset */
3862d14b0ac1SNavdeep Parhar 		eq->udb_qid = eq->cntxt_id & mask;		/* id in page */
3863f10405b3SNavdeep Parhar 		if (eq->udb_qid >= PAGE_SIZE / UDBS_SEG_SIZE)
386477ad3c41SNavdeep Parhar 	    		clrbit(&eq->doorbells, DOORBELL_WCWR);
3865d14b0ac1SNavdeep Parhar 		else {
3866d14b0ac1SNavdeep Parhar 			udb += eq->udb_qid << UDBS_SEG_SHIFT;	/* seg offset */
3867d14b0ac1SNavdeep Parhar 			eq->udb_qid = 0;
3868d14b0ac1SNavdeep Parhar 		}
3869d14b0ac1SNavdeep Parhar 		eq->udb = (volatile void *)udb;
3870d14b0ac1SNavdeep Parhar 	}
3871d14b0ac1SNavdeep Parhar 
3872733b9277SNavdeep Parhar 	return (rc);
3873733b9277SNavdeep Parhar }
3874733b9277SNavdeep Parhar 
3875733b9277SNavdeep Parhar static int
3876733b9277SNavdeep Parhar free_eq(struct adapter *sc, struct sge_eq *eq)
3877733b9277SNavdeep Parhar {
3878733b9277SNavdeep Parhar 	int rc;
3879733b9277SNavdeep Parhar 
3880733b9277SNavdeep Parhar 	if (eq->flags & EQ_ALLOCATED) {
3881733b9277SNavdeep Parhar 		switch (eq->flags & EQ_TYPEMASK) {
3882733b9277SNavdeep Parhar 		case EQ_CTRL:
3883733b9277SNavdeep Parhar 			rc = -t4_ctrl_eq_free(sc, sc->mbox, sc->pf, 0,
3884733b9277SNavdeep Parhar 			    eq->cntxt_id);
3885733b9277SNavdeep Parhar 			break;
3886733b9277SNavdeep Parhar 
3887733b9277SNavdeep Parhar 		case EQ_ETH:
3888733b9277SNavdeep Parhar 			rc = -t4_eth_eq_free(sc, sc->mbox, sc->pf, 0,
3889733b9277SNavdeep Parhar 			    eq->cntxt_id);
3890733b9277SNavdeep Parhar 			break;
3891733b9277SNavdeep Parhar 
3892eff62dbaSNavdeep Parhar #if defined(TCP_OFFLOAD) || defined(RATELIMIT)
3893733b9277SNavdeep Parhar 		case EQ_OFLD:
3894733b9277SNavdeep Parhar 			rc = -t4_ofld_eq_free(sc, sc->mbox, sc->pf, 0,
3895733b9277SNavdeep Parhar 			    eq->cntxt_id);
3896733b9277SNavdeep Parhar 			break;
3897733b9277SNavdeep Parhar #endif
3898733b9277SNavdeep Parhar 
3899733b9277SNavdeep Parhar 		default:
3900733b9277SNavdeep Parhar 			panic("%s: invalid eq type %d.", __func__,
3901733b9277SNavdeep Parhar 			    eq->flags & EQ_TYPEMASK);
3902733b9277SNavdeep Parhar 		}
3903733b9277SNavdeep Parhar 		if (rc != 0) {
3904733b9277SNavdeep Parhar 			device_printf(sc->dev,
3905733b9277SNavdeep Parhar 			    "failed to free egress queue (%d): %d\n",
3906733b9277SNavdeep Parhar 			    eq->flags & EQ_TYPEMASK, rc);
3907733b9277SNavdeep Parhar 			return (rc);
3908733b9277SNavdeep Parhar 		}
3909733b9277SNavdeep Parhar 		eq->flags &= ~EQ_ALLOCATED;
3910733b9277SNavdeep Parhar 	}
3911733b9277SNavdeep Parhar 
3912733b9277SNavdeep Parhar 	free_ring(sc, eq->desc_tag, eq->desc_map, eq->ba, eq->desc);
3913733b9277SNavdeep Parhar 
3914733b9277SNavdeep Parhar 	if (mtx_initialized(&eq->eq_lock))
3915733b9277SNavdeep Parhar 		mtx_destroy(&eq->eq_lock);
3916733b9277SNavdeep Parhar 
3917733b9277SNavdeep Parhar 	bzero(eq, sizeof(*eq));
3918733b9277SNavdeep Parhar 	return (0);
3919733b9277SNavdeep Parhar }
3920733b9277SNavdeep Parhar 
3921733b9277SNavdeep Parhar static int
3922fe2ebb76SJohn Baldwin alloc_wrq(struct adapter *sc, struct vi_info *vi, struct sge_wrq *wrq,
3923733b9277SNavdeep Parhar     struct sysctl_oid *oid)
3924733b9277SNavdeep Parhar {
3925733b9277SNavdeep Parhar 	int rc;
3926fe2ebb76SJohn Baldwin 	struct sysctl_ctx_list *ctx = vi ? &vi->ctx : &sc->ctx;
3927733b9277SNavdeep Parhar 	struct sysctl_oid_list *children = SYSCTL_CHILDREN(oid);
3928733b9277SNavdeep Parhar 
3929fe2ebb76SJohn Baldwin 	rc = alloc_eq(sc, vi, &wrq->eq);
3930733b9277SNavdeep Parhar 	if (rc)
3931733b9277SNavdeep Parhar 		return (rc);
3932733b9277SNavdeep Parhar 
3933733b9277SNavdeep Parhar 	wrq->adapter = sc;
39347951040fSNavdeep Parhar 	TASK_INIT(&wrq->wrq_tx_task, 0, wrq_tx_drain, wrq);
39357951040fSNavdeep Parhar 	TAILQ_INIT(&wrq->incomplete_wrs);
393609fe6320SNavdeep Parhar 	STAILQ_INIT(&wrq->wr_list);
39377951040fSNavdeep Parhar 	wrq->nwr_pending = 0;
39387951040fSNavdeep Parhar 	wrq->ndesc_needed = 0;
3939733b9277SNavdeep Parhar 
3940aa93b99aSNavdeep Parhar 	SYSCTL_ADD_UAUTO(ctx, children, OID_AUTO, "ba", CTLFLAG_RD,
3941aa93b99aSNavdeep Parhar 	    &wrq->eq.ba, "bus address of descriptor ring");
3942aa93b99aSNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "dmalen", CTLFLAG_RD, NULL,
3943aa93b99aSNavdeep Parhar 	    wrq->eq.sidx * EQ_ESIZE + sc->params.sge.spg_len,
3944aa93b99aSNavdeep Parhar 	    "desc ring size in bytes");
3945733b9277SNavdeep Parhar 	SYSCTL_ADD_UINT(ctx, children, OID_AUTO, "cntxt_id", CTLFLAG_RD,
3946733b9277SNavdeep Parhar 	    &wrq->eq.cntxt_id, 0, "SGE context id of the queue");
3947733b9277SNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "cidx",
3948733b9277SNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &wrq->eq.cidx, 0, sysctl_uint16, "I",
3949733b9277SNavdeep Parhar 	    "consumer index");
3950733b9277SNavdeep Parhar 	SYSCTL_ADD_PROC(ctx, children, OID_AUTO, "pidx",
3951733b9277SNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &wrq->eq.pidx, 0, sysctl_uint16, "I",
3952733b9277SNavdeep Parhar 	    "producer index");
3953aa93b99aSNavdeep Parhar 	SYSCTL_ADD_INT(ctx, children, OID_AUTO, "sidx", CTLFLAG_RD, NULL,
3954aa93b99aSNavdeep Parhar 	    wrq->eq.sidx, "status page index");
39557951040fSNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "tx_wrs_direct", CTLFLAG_RD,
39567951040fSNavdeep Parhar 	    &wrq->tx_wrs_direct, "# of work requests (direct)");
39577951040fSNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "tx_wrs_copied", CTLFLAG_RD,
39587951040fSNavdeep Parhar 	    &wrq->tx_wrs_copied, "# of work requests (copied)");
39590459a175SNavdeep Parhar 	SYSCTL_ADD_UQUAD(ctx, children, OID_AUTO, "tx_wrs_sspace", CTLFLAG_RD,
39600459a175SNavdeep Parhar 	    &wrq->tx_wrs_ss, "# of work requests (copied from scratch space)");
3961733b9277SNavdeep Parhar 
3962733b9277SNavdeep Parhar 	return (rc);
3963733b9277SNavdeep Parhar }
3964733b9277SNavdeep Parhar 
3965733b9277SNavdeep Parhar static int
3966733b9277SNavdeep Parhar free_wrq(struct adapter *sc, struct sge_wrq *wrq)
3967733b9277SNavdeep Parhar {
3968733b9277SNavdeep Parhar 	int rc;
3969733b9277SNavdeep Parhar 
3970733b9277SNavdeep Parhar 	rc = free_eq(sc, &wrq->eq);
3971733b9277SNavdeep Parhar 	if (rc)
3972733b9277SNavdeep Parhar 		return (rc);
3973733b9277SNavdeep Parhar 
3974733b9277SNavdeep Parhar 	bzero(wrq, sizeof(*wrq));
3975733b9277SNavdeep Parhar 	return (0);
3976733b9277SNavdeep Parhar }
3977733b9277SNavdeep Parhar 
3978733b9277SNavdeep Parhar static int
3979fe2ebb76SJohn Baldwin alloc_txq(struct vi_info *vi, struct sge_txq *txq, int idx,
3980733b9277SNavdeep Parhar     struct sysctl_oid *oid)
3981733b9277SNavdeep Parhar {
3982733b9277SNavdeep Parhar 	int rc;
3983fe2ebb76SJohn Baldwin 	struct port_info *pi = vi->pi;
3984733b9277SNavdeep Parhar 	struct adapter *sc = pi->adapter;
3985733b9277SNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
3986733b9277SNavdeep Parhar 	char name[16];
3987733b9277SNavdeep Parhar 	struct sysctl_oid_list *children = SYSCTL_CHILDREN(oid);
3988733b9277SNavdeep Parhar 
39897951040fSNavdeep Parhar 	rc = mp_ring_alloc(&txq->r, eq->sidx, txq, eth_tx, can_resume_eth_tx,
39907951040fSNavdeep Parhar 	    M_CXGBE, M_WAITOK);
39917951040fSNavdeep Parhar 	if (rc != 0) {
39927951040fSNavdeep Parhar 		device_printf(sc->dev, "failed to allocate mp_ring: %d\n", rc);
39937951040fSNavdeep Parhar 		return (rc);
39947951040fSNavdeep Parhar 	}
39957951040fSNavdeep Parhar 
3996fe2ebb76SJohn Baldwin 	rc = alloc_eq(sc, vi, eq);
39977951040fSNavdeep Parhar 	if (rc != 0) {
39987951040fSNavdeep Parhar 		mp_ring_free(txq->r);
39997951040fSNavdeep Parhar 		txq->r = NULL;
4000733b9277SNavdeep Parhar 		return (rc);
40017951040fSNavdeep Parhar 	}
4002733b9277SNavdeep Parhar 
40037951040fSNavdeep Parhar 	/* Can't fail after this point. */
40047951040fSNavdeep Parhar 
4005ec55567cSJohn Baldwin 	if (idx == 0)
4006ec55567cSJohn Baldwin 		sc->sge.eq_base = eq->abs_id - eq->cntxt_id;
4007ec55567cSJohn Baldwin 	else
4008ec55567cSJohn Baldwin 		KASSERT(eq->cntxt_id + sc->sge.eq_base == eq->abs_id,
4009ec55567cSJohn Baldwin 		    ("eq_base mismatch"));
4010ec55567cSJohn Baldwin 	KASSERT(sc->sge.eq_base == 0 || sc->flags & IS_VF,
4011ec55567cSJohn Baldwin 	    ("PF with non-zero eq_base"));
4012ec55567cSJohn Baldwin 
40137951040fSNavdeep Parhar 	TASK_INIT(&txq->tx_reclaim_task, 0, tx_reclaim, eq);
4014fe2ebb76SJohn Baldwin 	txq->ifp = vi->ifp;
40157951040fSNavdeep Parhar 	txq->gl = sglist_alloc(TX_SGL_SEGS, M_WAITOK);
40166af45170SJohn Baldwin 	if (sc->flags & IS_VF)
40176af45170SJohn Baldwin 		txq->cpl_ctrl0 = htobe32(V_TXPKT_OPCODE(CPL_TX_PKT_XT) |
40186af45170SJohn Baldwin 		    V_TXPKT_INTF(pi->tx_chan));
40196af45170SJohn Baldwin 	else
40207951040fSNavdeep Parhar 		txq->cpl_ctrl0 = htobe32(V_TXPKT_OPCODE(CPL_TX_PKT) |
402197f2919dSNavdeep Parhar 		    V_TXPKT_INTF(pi->tx_chan) |
402297f2919dSNavdeep Parhar 		    V_TXPKT_PF(G_FW_VIID_PFN(vi->viid)) |
402397f2919dSNavdeep Parhar 		    V_TXPKT_VF(G_FW_VIID_VIN(vi->viid)) |
402497f2919dSNavdeep Parhar 		    V_TXPKT_VF_VLD(G_FW_VIID_VIVLD(vi->viid)));
402502f972e8SNavdeep Parhar 	txq->tc_idx = -1;
40267951040fSNavdeep Parhar 	txq->sdesc = malloc(eq->sidx * sizeof(struct tx_sdesc), M_CXGBE,
4027733b9277SNavdeep Parhar 	    M_ZERO | M_WAITOK);
402854e4ee71SNavdeep Parhar 
402954e4ee71SNavdeep Parhar 	snprintf(name, sizeof(name), "%d", idx);
4030fe2ebb76SJohn Baldwin 	oid = SYSCTL_ADD_NODE(&vi->ctx, children, OID_AUTO, name, CTLFLAG_RD,
403154e4ee71SNavdeep Parhar 	    NULL, "tx queue");
403254e4ee71SNavdeep Parhar 	children = SYSCTL_CHILDREN(oid);
403354e4ee71SNavdeep Parhar 
4034aa93b99aSNavdeep Parhar 	SYSCTL_ADD_UAUTO(&vi->ctx, children, OID_AUTO, "ba", CTLFLAG_RD,
4035aa93b99aSNavdeep Parhar 	    &eq->ba, "bus address of descriptor ring");
4036aa93b99aSNavdeep Parhar 	SYSCTL_ADD_INT(&vi->ctx, children, OID_AUTO, "dmalen", CTLFLAG_RD, NULL,
4037aa93b99aSNavdeep Parhar 	    eq->sidx * EQ_ESIZE + sc->params.sge.spg_len,
4038aa93b99aSNavdeep Parhar 	    "desc ring size in bytes");
4039ec55567cSJohn Baldwin 	SYSCTL_ADD_UINT(&vi->ctx, children, OID_AUTO, "abs_id", CTLFLAG_RD,
4040ec55567cSJohn Baldwin 	    &eq->abs_id, 0, "absolute id of the queue");
4041fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UINT(&vi->ctx, children, OID_AUTO, "cntxt_id", CTLFLAG_RD,
404259bc8ce0SNavdeep Parhar 	    &eq->cntxt_id, 0, "SGE context id of the queue");
4043fe2ebb76SJohn Baldwin 	SYSCTL_ADD_PROC(&vi->ctx, children, OID_AUTO, "cidx",
404459bc8ce0SNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &eq->cidx, 0, sysctl_uint16, "I",
404559bc8ce0SNavdeep Parhar 	    "consumer index");
4046fe2ebb76SJohn Baldwin 	SYSCTL_ADD_PROC(&vi->ctx, children, OID_AUTO, "pidx",
404759bc8ce0SNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RD, &eq->pidx, 0, sysctl_uint16, "I",
404859bc8ce0SNavdeep Parhar 	    "producer index");
4049aa93b99aSNavdeep Parhar 	SYSCTL_ADD_INT(&vi->ctx, children, OID_AUTO, "sidx", CTLFLAG_RD, NULL,
4050aa93b99aSNavdeep Parhar 	    eq->sidx, "status page index");
405159bc8ce0SNavdeep Parhar 
405202f972e8SNavdeep Parhar 	SYSCTL_ADD_PROC(&vi->ctx, children, OID_AUTO, "tc",
405302f972e8SNavdeep Parhar 	    CTLTYPE_INT | CTLFLAG_RW, vi, idx, sysctl_tc, "I",
405402f972e8SNavdeep Parhar 	    "traffic class (-1 means none)");
405502f972e8SNavdeep Parhar 
4056fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "txcsum", CTLFLAG_RD,
405754e4ee71SNavdeep Parhar 	    &txq->txcsum, "# of times hardware assisted with checksum");
4058fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "vlan_insertion",
405954e4ee71SNavdeep Parhar 	    CTLFLAG_RD, &txq->vlan_insertion,
406054e4ee71SNavdeep Parhar 	    "# of times hardware inserted 802.1Q tag");
4061fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "tso_wrs", CTLFLAG_RD,
4062a1ea9a82SNavdeep Parhar 	    &txq->tso_wrs, "# of TSO work requests");
4063fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "imm_wrs", CTLFLAG_RD,
406454e4ee71SNavdeep Parhar 	    &txq->imm_wrs, "# of work requests with immediate data");
4065fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "sgl_wrs", CTLFLAG_RD,
406654e4ee71SNavdeep Parhar 	    &txq->sgl_wrs, "# of work requests with direct SGL");
4067fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "txpkt_wrs", CTLFLAG_RD,
406854e4ee71SNavdeep Parhar 	    &txq->txpkt_wrs, "# of txpkt work requests (one pkt/WR)");
4069fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "txpkts0_wrs",
40707951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->txpkts0_wrs,
40717951040fSNavdeep Parhar 	    "# of txpkts (type 0) work requests");
4072fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "txpkts1_wrs",
40737951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->txpkts1_wrs,
40747951040fSNavdeep Parhar 	    "# of txpkts (type 1) work requests");
4075fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "txpkts0_pkts",
40767951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->txpkts0_pkts,
40777951040fSNavdeep Parhar 	    "# of frames tx'd using type0 txpkts work requests");
4078fe2ebb76SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "txpkts1_pkts",
40797951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->txpkts1_pkts,
40807951040fSNavdeep Parhar 	    "# of frames tx'd using type1 txpkts work requests");
4081*5cdaef71SJohn Baldwin 	SYSCTL_ADD_UQUAD(&vi->ctx, children, OID_AUTO, "raw_wrs", CTLFLAG_RD,
4082*5cdaef71SJohn Baldwin 	    &txq->raw_wrs, "# of raw work requests (non-packets)");
408354e4ee71SNavdeep Parhar 
4084fe2ebb76SJohn Baldwin 	SYSCTL_ADD_COUNTER_U64(&vi->ctx, children, OID_AUTO, "r_enqueues",
40857951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->r->enqueues,
40867951040fSNavdeep Parhar 	    "# of enqueues to the mp_ring for this queue");
4087fe2ebb76SJohn Baldwin 	SYSCTL_ADD_COUNTER_U64(&vi->ctx, children, OID_AUTO, "r_drops",
40887951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->r->drops,
40897951040fSNavdeep Parhar 	    "# of drops in the mp_ring for this queue");
4090fe2ebb76SJohn Baldwin 	SYSCTL_ADD_COUNTER_U64(&vi->ctx, children, OID_AUTO, "r_starts",
40917951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->r->starts,
40927951040fSNavdeep Parhar 	    "# of normal consumer starts in the mp_ring for this queue");
4093fe2ebb76SJohn Baldwin 	SYSCTL_ADD_COUNTER_U64(&vi->ctx, children, OID_AUTO, "r_stalls",
40947951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->r->stalls,
40957951040fSNavdeep Parhar 	    "# of consumer stalls in the mp_ring for this queue");
4096fe2ebb76SJohn Baldwin 	SYSCTL_ADD_COUNTER_U64(&vi->ctx, children, OID_AUTO, "r_restarts",
40977951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->r->restarts,
40987951040fSNavdeep Parhar 	    "# of consumer restarts in the mp_ring for this queue");
4099fe2ebb76SJohn Baldwin 	SYSCTL_ADD_COUNTER_U64(&vi->ctx, children, OID_AUTO, "r_abdications",
41007951040fSNavdeep Parhar 	    CTLFLAG_RD, &txq->r->abdications,
41017951040fSNavdeep Parhar 	    "# of consumer abdications in the mp_ring for this queue");
410254e4ee71SNavdeep Parhar 
41037951040fSNavdeep Parhar 	return (0);
410454e4ee71SNavdeep Parhar }
410554e4ee71SNavdeep Parhar 
410654e4ee71SNavdeep Parhar static int
4107fe2ebb76SJohn Baldwin free_txq(struct vi_info *vi, struct sge_txq *txq)
410854e4ee71SNavdeep Parhar {
410954e4ee71SNavdeep Parhar 	int rc;
4110fe2ebb76SJohn Baldwin 	struct adapter *sc = vi->pi->adapter;
411154e4ee71SNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
411254e4ee71SNavdeep Parhar 
4113733b9277SNavdeep Parhar 	rc = free_eq(sc, eq);
4114733b9277SNavdeep Parhar 	if (rc)
411554e4ee71SNavdeep Parhar 		return (rc);
411654e4ee71SNavdeep Parhar 
41177951040fSNavdeep Parhar 	sglist_free(txq->gl);
4118f7dfe243SNavdeep Parhar 	free(txq->sdesc, M_CXGBE);
41197951040fSNavdeep Parhar 	mp_ring_free(txq->r);
412054e4ee71SNavdeep Parhar 
412154e4ee71SNavdeep Parhar 	bzero(txq, sizeof(*txq));
412254e4ee71SNavdeep Parhar 	return (0);
412354e4ee71SNavdeep Parhar }
412454e4ee71SNavdeep Parhar 
412554e4ee71SNavdeep Parhar static void
412654e4ee71SNavdeep Parhar oneseg_dma_callback(void *arg, bus_dma_segment_t *segs, int nseg, int error)
412754e4ee71SNavdeep Parhar {
412854e4ee71SNavdeep Parhar 	bus_addr_t *ba = arg;
412954e4ee71SNavdeep Parhar 
413054e4ee71SNavdeep Parhar 	KASSERT(nseg == 1,
413154e4ee71SNavdeep Parhar 	    ("%s meant for single segment mappings only.", __func__));
413254e4ee71SNavdeep Parhar 
413354e4ee71SNavdeep Parhar 	*ba = error ? 0 : segs->ds_addr;
413454e4ee71SNavdeep Parhar }
413554e4ee71SNavdeep Parhar 
413654e4ee71SNavdeep Parhar static inline void
413754e4ee71SNavdeep Parhar ring_fl_db(struct adapter *sc, struct sge_fl *fl)
413854e4ee71SNavdeep Parhar {
41394d6db4e0SNavdeep Parhar 	uint32_t n, v;
414054e4ee71SNavdeep Parhar 
41414d6db4e0SNavdeep Parhar 	n = IDXDIFF(fl->pidx / 8, fl->dbidx, fl->sidx);
41424d6db4e0SNavdeep Parhar 	MPASS(n > 0);
4143d14b0ac1SNavdeep Parhar 
414454e4ee71SNavdeep Parhar 	wmb();
41454d6db4e0SNavdeep Parhar 	v = fl->dbval | V_PIDX(n);
41464d6db4e0SNavdeep Parhar 	if (fl->udb)
41474d6db4e0SNavdeep Parhar 		*fl->udb = htole32(v);
41484d6db4e0SNavdeep Parhar 	else
4149315048f2SJohn Baldwin 		t4_write_reg(sc, sc->sge_kdoorbell_reg, v);
41504d6db4e0SNavdeep Parhar 	IDXINCR(fl->dbidx, n, fl->sidx);
415154e4ee71SNavdeep Parhar }
415254e4ee71SNavdeep Parhar 
4153fb12416cSNavdeep Parhar /*
41544d6db4e0SNavdeep Parhar  * Fills up the freelist by allocating up to 'n' buffers.  Buffers that are
41554d6db4e0SNavdeep Parhar  * recycled do not count towards this allocation budget.
4156733b9277SNavdeep Parhar  *
41574d6db4e0SNavdeep Parhar  * Returns non-zero to indicate that this freelist should be added to the list
41584d6db4e0SNavdeep Parhar  * of starving freelists.
4159fb12416cSNavdeep Parhar  */
4160733b9277SNavdeep Parhar static int
41614d6db4e0SNavdeep Parhar refill_fl(struct adapter *sc, struct sge_fl *fl, int n)
416254e4ee71SNavdeep Parhar {
41634d6db4e0SNavdeep Parhar 	__be64 *d;
41644d6db4e0SNavdeep Parhar 	struct fl_sdesc *sd;
416538035ed6SNavdeep Parhar 	uintptr_t pa;
416654e4ee71SNavdeep Parhar 	caddr_t cl;
41674d6db4e0SNavdeep Parhar 	struct cluster_layout *cll;
41684d6db4e0SNavdeep Parhar 	struct sw_zone_info *swz;
416938035ed6SNavdeep Parhar 	struct cluster_metadata *clm;
41704d6db4e0SNavdeep Parhar 	uint16_t max_pidx;
41714d6db4e0SNavdeep Parhar 	uint16_t hw_cidx = fl->hw_cidx;		/* stable snapshot */
417254e4ee71SNavdeep Parhar 
417354e4ee71SNavdeep Parhar 	FL_LOCK_ASSERT_OWNED(fl);
417454e4ee71SNavdeep Parhar 
41754d6db4e0SNavdeep Parhar 	/*
4176453130d9SPedro F. Giffuni 	 * We always stop at the beginning of the hardware descriptor that's just
41774d6db4e0SNavdeep Parhar 	 * before the one with the hw cidx.  This is to avoid hw pidx = hw cidx,
41784d6db4e0SNavdeep Parhar 	 * which would mean an empty freelist to the chip.
41794d6db4e0SNavdeep Parhar 	 */
41804d6db4e0SNavdeep Parhar 	max_pidx = __predict_false(hw_cidx == 0) ? fl->sidx - 1 : hw_cidx - 1;
41814d6db4e0SNavdeep Parhar 	if (fl->pidx == max_pidx * 8)
41824d6db4e0SNavdeep Parhar 		return (0);
418354e4ee71SNavdeep Parhar 
41844d6db4e0SNavdeep Parhar 	d = &fl->desc[fl->pidx];
41854d6db4e0SNavdeep Parhar 	sd = &fl->sdesc[fl->pidx];
41864d6db4e0SNavdeep Parhar 	cll = &fl->cll_def;	/* default layout */
41874d6db4e0SNavdeep Parhar 	swz = &sc->sge.sw_zone_info[cll->zidx];
41884d6db4e0SNavdeep Parhar 
41894d6db4e0SNavdeep Parhar 	while (n > 0) {
419054e4ee71SNavdeep Parhar 
419154e4ee71SNavdeep Parhar 		if (sd->cl != NULL) {
419254e4ee71SNavdeep Parhar 
4193c3fb7725SNavdeep Parhar 			if (sd->nmbuf == 0) {
419438035ed6SNavdeep Parhar 				/*
419538035ed6SNavdeep Parhar 				 * Fast recycle without involving any atomics on
419638035ed6SNavdeep Parhar 				 * the cluster's metadata (if the cluster has
419738035ed6SNavdeep Parhar 				 * metadata).  This happens when all frames
419838035ed6SNavdeep Parhar 				 * received in the cluster were small enough to
419938035ed6SNavdeep Parhar 				 * fit within a single mbuf each.
420038035ed6SNavdeep Parhar 				 */
420138035ed6SNavdeep Parhar 				fl->cl_fast_recycled++;
4202ccc69b2fSNavdeep Parhar #ifdef INVARIANTS
4203ccc69b2fSNavdeep Parhar 				clm = cl_metadata(sc, fl, &sd->cll, sd->cl);
4204ccc69b2fSNavdeep Parhar 				if (clm != NULL)
4205ccc69b2fSNavdeep Parhar 					MPASS(clm->refcount == 1);
4206ccc69b2fSNavdeep Parhar #endif
420738035ed6SNavdeep Parhar 				goto recycled_fast;
420838035ed6SNavdeep Parhar 			}
420954e4ee71SNavdeep Parhar 
421038035ed6SNavdeep Parhar 			/*
421138035ed6SNavdeep Parhar 			 * Cluster is guaranteed to have metadata.  Clusters
421238035ed6SNavdeep Parhar 			 * without metadata always take the fast recycle path
421338035ed6SNavdeep Parhar 			 * when they're recycled.
421438035ed6SNavdeep Parhar 			 */
421538035ed6SNavdeep Parhar 			clm = cl_metadata(sc, fl, &sd->cll, sd->cl);
421638035ed6SNavdeep Parhar 			MPASS(clm != NULL);
42171458bff9SNavdeep Parhar 
421838035ed6SNavdeep Parhar 			if (atomic_fetchadd_int(&clm->refcount, -1) == 1) {
421938035ed6SNavdeep Parhar 				fl->cl_recycled++;
422082eff304SNavdeep Parhar 				counter_u64_add(extfree_rels, 1);
422154e4ee71SNavdeep Parhar 				goto recycled;
422254e4ee71SNavdeep Parhar 			}
42231458bff9SNavdeep Parhar 			sd->cl = NULL;	/* gave up my reference */
42241458bff9SNavdeep Parhar 		}
422538035ed6SNavdeep Parhar 		MPASS(sd->cl == NULL);
422638035ed6SNavdeep Parhar alloc:
422738035ed6SNavdeep Parhar 		cl = uma_zalloc(swz->zone, M_NOWAIT);
422838035ed6SNavdeep Parhar 		if (__predict_false(cl == NULL)) {
422938035ed6SNavdeep Parhar 			if (cll == &fl->cll_alt || fl->cll_alt.zidx == -1 ||
423038035ed6SNavdeep Parhar 			    fl->cll_def.zidx == fl->cll_alt.zidx)
423154e4ee71SNavdeep Parhar 				break;
423254e4ee71SNavdeep Parhar 
423338035ed6SNavdeep Parhar 			/* fall back to the safe zone */
423438035ed6SNavdeep Parhar 			cll = &fl->cll_alt;
423538035ed6SNavdeep Parhar 			swz = &sc->sge.sw_zone_info[cll->zidx];
423638035ed6SNavdeep Parhar 			goto alloc;
423754e4ee71SNavdeep Parhar 		}
423838035ed6SNavdeep Parhar 		fl->cl_allocated++;
42394d6db4e0SNavdeep Parhar 		n--;
424054e4ee71SNavdeep Parhar 
424138035ed6SNavdeep Parhar 		pa = pmap_kextract((vm_offset_t)cl);
424238035ed6SNavdeep Parhar 		pa += cll->region1;
424354e4ee71SNavdeep Parhar 		sd->cl = cl;
424438035ed6SNavdeep Parhar 		sd->cll = *cll;
424538035ed6SNavdeep Parhar 		*d = htobe64(pa | cll->hwidx);
424638035ed6SNavdeep Parhar 		clm = cl_metadata(sc, fl, cll, cl);
424738035ed6SNavdeep Parhar 		if (clm != NULL) {
42487d29df59SNavdeep Parhar recycled:
424938035ed6SNavdeep Parhar #ifdef INVARIANTS
425038035ed6SNavdeep Parhar 			clm->sd = sd;
425138035ed6SNavdeep Parhar #endif
425238035ed6SNavdeep Parhar 			clm->refcount = 1;
425338035ed6SNavdeep Parhar 		}
4254c3fb7725SNavdeep Parhar 		sd->nmbuf = 0;
425538035ed6SNavdeep Parhar recycled_fast:
425638035ed6SNavdeep Parhar 		d++;
425754e4ee71SNavdeep Parhar 		sd++;
42584d6db4e0SNavdeep Parhar 		if (__predict_false(++fl->pidx % 8 == 0)) {
42594d6db4e0SNavdeep Parhar 			uint16_t pidx = fl->pidx / 8;
42604d6db4e0SNavdeep Parhar 
42614d6db4e0SNavdeep Parhar 			if (__predict_false(pidx == fl->sidx)) {
426254e4ee71SNavdeep Parhar 				fl->pidx = 0;
42634d6db4e0SNavdeep Parhar 				pidx = 0;
426454e4ee71SNavdeep Parhar 				sd = fl->sdesc;
426554e4ee71SNavdeep Parhar 				d = fl->desc;
426654e4ee71SNavdeep Parhar 			}
42674d6db4e0SNavdeep Parhar 			if (pidx == max_pidx)
42684d6db4e0SNavdeep Parhar 				break;
42694d6db4e0SNavdeep Parhar 
42704d6db4e0SNavdeep Parhar 			if (IDXDIFF(pidx, fl->dbidx, fl->sidx) >= 4)
42714d6db4e0SNavdeep Parhar 				ring_fl_db(sc, fl);
42724d6db4e0SNavdeep Parhar 		}
427354e4ee71SNavdeep Parhar 	}
4274fb12416cSNavdeep Parhar 
42754d6db4e0SNavdeep Parhar 	if (fl->pidx / 8 != fl->dbidx)
4276fb12416cSNavdeep Parhar 		ring_fl_db(sc, fl);
4277733b9277SNavdeep Parhar 
4278733b9277SNavdeep Parhar 	return (FL_RUNNING_LOW(fl) && !(fl->flags & FL_STARVING));
4279733b9277SNavdeep Parhar }
4280733b9277SNavdeep Parhar 
4281733b9277SNavdeep Parhar /*
4282733b9277SNavdeep Parhar  * Attempt to refill all starving freelists.
4283733b9277SNavdeep Parhar  */
4284733b9277SNavdeep Parhar static void
4285733b9277SNavdeep Parhar refill_sfl(void *arg)
4286733b9277SNavdeep Parhar {
4287733b9277SNavdeep Parhar 	struct adapter *sc = arg;
4288733b9277SNavdeep Parhar 	struct sge_fl *fl, *fl_temp;
4289733b9277SNavdeep Parhar 
4290fe2ebb76SJohn Baldwin 	mtx_assert(&sc->sfl_lock, MA_OWNED);
4291733b9277SNavdeep Parhar 	TAILQ_FOREACH_SAFE(fl, &sc->sfl, link, fl_temp) {
4292733b9277SNavdeep Parhar 		FL_LOCK(fl);
4293733b9277SNavdeep Parhar 		refill_fl(sc, fl, 64);
4294733b9277SNavdeep Parhar 		if (FL_NOT_RUNNING_LOW(fl) || fl->flags & FL_DOOMED) {
4295733b9277SNavdeep Parhar 			TAILQ_REMOVE(&sc->sfl, fl, link);
4296733b9277SNavdeep Parhar 			fl->flags &= ~FL_STARVING;
4297733b9277SNavdeep Parhar 		}
4298733b9277SNavdeep Parhar 		FL_UNLOCK(fl);
4299733b9277SNavdeep Parhar 	}
4300733b9277SNavdeep Parhar 
4301733b9277SNavdeep Parhar 	if (!TAILQ_EMPTY(&sc->sfl))
4302733b9277SNavdeep Parhar 		callout_schedule(&sc->sfl_callout, hz / 5);
430354e4ee71SNavdeep Parhar }
430454e4ee71SNavdeep Parhar 
430554e4ee71SNavdeep Parhar static int
430654e4ee71SNavdeep Parhar alloc_fl_sdesc(struct sge_fl *fl)
430754e4ee71SNavdeep Parhar {
430854e4ee71SNavdeep Parhar 
43094d6db4e0SNavdeep Parhar 	fl->sdesc = malloc(fl->sidx * 8 * sizeof(struct fl_sdesc), M_CXGBE,
431054e4ee71SNavdeep Parhar 	    M_ZERO | M_WAITOK);
431154e4ee71SNavdeep Parhar 
431254e4ee71SNavdeep Parhar 	return (0);
431354e4ee71SNavdeep Parhar }
431454e4ee71SNavdeep Parhar 
431554e4ee71SNavdeep Parhar static void
43161458bff9SNavdeep Parhar free_fl_sdesc(struct adapter *sc, struct sge_fl *fl)
431754e4ee71SNavdeep Parhar {
431854e4ee71SNavdeep Parhar 	struct fl_sdesc *sd;
431938035ed6SNavdeep Parhar 	struct cluster_metadata *clm;
432038035ed6SNavdeep Parhar 	struct cluster_layout *cll;
432154e4ee71SNavdeep Parhar 	int i;
432254e4ee71SNavdeep Parhar 
432354e4ee71SNavdeep Parhar 	sd = fl->sdesc;
43244d6db4e0SNavdeep Parhar 	for (i = 0; i < fl->sidx * 8; i++, sd++) {
432538035ed6SNavdeep Parhar 		if (sd->cl == NULL)
432638035ed6SNavdeep Parhar 			continue;
432754e4ee71SNavdeep Parhar 
432838035ed6SNavdeep Parhar 		cll = &sd->cll;
432938035ed6SNavdeep Parhar 		clm = cl_metadata(sc, fl, cll, sd->cl);
433082eff304SNavdeep Parhar 		if (sd->nmbuf == 0)
433138035ed6SNavdeep Parhar 			uma_zfree(sc->sge.sw_zone_info[cll->zidx].zone, sd->cl);
433282eff304SNavdeep Parhar 		else if (clm && atomic_fetchadd_int(&clm->refcount, -1) == 1) {
433382eff304SNavdeep Parhar 			uma_zfree(sc->sge.sw_zone_info[cll->zidx].zone, sd->cl);
433482eff304SNavdeep Parhar 			counter_u64_add(extfree_rels, 1);
433554e4ee71SNavdeep Parhar 		}
433638035ed6SNavdeep Parhar 		sd->cl = NULL;
433754e4ee71SNavdeep Parhar 	}
433854e4ee71SNavdeep Parhar 
433954e4ee71SNavdeep Parhar 	free(fl->sdesc, M_CXGBE);
434054e4ee71SNavdeep Parhar 	fl->sdesc = NULL;
434154e4ee71SNavdeep Parhar }
434254e4ee71SNavdeep Parhar 
43437951040fSNavdeep Parhar static inline void
43447951040fSNavdeep Parhar get_pkt_gl(struct mbuf *m, struct sglist *gl)
434554e4ee71SNavdeep Parhar {
43467951040fSNavdeep Parhar 	int rc;
434754e4ee71SNavdeep Parhar 
43487951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m);
434954e4ee71SNavdeep Parhar 
43507951040fSNavdeep Parhar 	sglist_reset(gl);
43517951040fSNavdeep Parhar 	rc = sglist_append_mbuf(gl, m);
43527951040fSNavdeep Parhar 	if (__predict_false(rc != 0)) {
43537951040fSNavdeep Parhar 		panic("%s: mbuf %p (%d segs) was vetted earlier but now fails "
43547951040fSNavdeep Parhar 		    "with %d.", __func__, m, mbuf_nsegs(m), rc);
435554e4ee71SNavdeep Parhar 	}
435654e4ee71SNavdeep Parhar 
43577951040fSNavdeep Parhar 	KASSERT(gl->sg_nseg == mbuf_nsegs(m),
43587951040fSNavdeep Parhar 	    ("%s: nsegs changed for mbuf %p from %d to %d", __func__, m,
43597951040fSNavdeep Parhar 	    mbuf_nsegs(m), gl->sg_nseg));
43607951040fSNavdeep Parhar 	KASSERT(gl->sg_nseg > 0 &&
43617951040fSNavdeep Parhar 	    gl->sg_nseg <= (needs_tso(m) ? TX_SGL_SEGS_TSO : TX_SGL_SEGS),
43627951040fSNavdeep Parhar 	    ("%s: %d segments, should have been 1 <= nsegs <= %d", __func__,
43637951040fSNavdeep Parhar 		gl->sg_nseg, needs_tso(m) ? TX_SGL_SEGS_TSO : TX_SGL_SEGS));
436454e4ee71SNavdeep Parhar }
436554e4ee71SNavdeep Parhar 
436654e4ee71SNavdeep Parhar /*
43677951040fSNavdeep Parhar  * len16 for a txpkt WR with a GL.  Includes the firmware work request header.
436854e4ee71SNavdeep Parhar  */
43697951040fSNavdeep Parhar static inline u_int
43707951040fSNavdeep Parhar txpkt_len16(u_int nsegs, u_int tso)
43717951040fSNavdeep Parhar {
43727951040fSNavdeep Parhar 	u_int n;
43737951040fSNavdeep Parhar 
43747951040fSNavdeep Parhar 	MPASS(nsegs > 0);
43757951040fSNavdeep Parhar 
43767951040fSNavdeep Parhar 	nsegs--; /* first segment is part of ulptx_sgl */
43777951040fSNavdeep Parhar 	n = sizeof(struct fw_eth_tx_pkt_wr) + sizeof(struct cpl_tx_pkt_core) +
43787951040fSNavdeep Parhar 	    sizeof(struct ulptx_sgl) + 8 * ((3 * nsegs) / 2 + (nsegs & 1));
43797951040fSNavdeep Parhar 	if (tso)
43807951040fSNavdeep Parhar 		n += sizeof(struct cpl_tx_pkt_lso_core);
43817951040fSNavdeep Parhar 
43827951040fSNavdeep Parhar 	return (howmany(n, 16));
43837951040fSNavdeep Parhar }
438454e4ee71SNavdeep Parhar 
438554e4ee71SNavdeep Parhar /*
43866af45170SJohn Baldwin  * len16 for a txpkt_vm WR with a GL.  Includes the firmware work
43876af45170SJohn Baldwin  * request header.
43886af45170SJohn Baldwin  */
43896af45170SJohn Baldwin static inline u_int
43906af45170SJohn Baldwin txpkt_vm_len16(u_int nsegs, u_int tso)
43916af45170SJohn Baldwin {
43926af45170SJohn Baldwin 	u_int n;
43936af45170SJohn Baldwin 
43946af45170SJohn Baldwin 	MPASS(nsegs > 0);
43956af45170SJohn Baldwin 
43966af45170SJohn Baldwin 	nsegs--; /* first segment is part of ulptx_sgl */
43976af45170SJohn Baldwin 	n = sizeof(struct fw_eth_tx_pkt_vm_wr) +
43986af45170SJohn Baldwin 	    sizeof(struct cpl_tx_pkt_core) +
43996af45170SJohn Baldwin 	    sizeof(struct ulptx_sgl) + 8 * ((3 * nsegs) / 2 + (nsegs & 1));
44006af45170SJohn Baldwin 	if (tso)
44016af45170SJohn Baldwin 		n += sizeof(struct cpl_tx_pkt_lso_core);
44026af45170SJohn Baldwin 
44036af45170SJohn Baldwin 	return (howmany(n, 16));
44046af45170SJohn Baldwin }
44056af45170SJohn Baldwin 
44066af45170SJohn Baldwin /*
44077951040fSNavdeep Parhar  * len16 for a txpkts type 0 WR with a GL.  Does not include the firmware work
44087951040fSNavdeep Parhar  * request header.
44097951040fSNavdeep Parhar  */
44107951040fSNavdeep Parhar static inline u_int
44117951040fSNavdeep Parhar txpkts0_len16(u_int nsegs)
44127951040fSNavdeep Parhar {
44137951040fSNavdeep Parhar 	u_int n;
44147951040fSNavdeep Parhar 
44157951040fSNavdeep Parhar 	MPASS(nsegs > 0);
44167951040fSNavdeep Parhar 
44177951040fSNavdeep Parhar 	nsegs--; /* first segment is part of ulptx_sgl */
44187951040fSNavdeep Parhar 	n = sizeof(struct ulp_txpkt) + sizeof(struct ulptx_idata) +
44197951040fSNavdeep Parhar 	    sizeof(struct cpl_tx_pkt_core) + sizeof(struct ulptx_sgl) +
44207951040fSNavdeep Parhar 	    8 * ((3 * nsegs) / 2 + (nsegs & 1));
44217951040fSNavdeep Parhar 
44227951040fSNavdeep Parhar 	return (howmany(n, 16));
44237951040fSNavdeep Parhar }
44247951040fSNavdeep Parhar 
44257951040fSNavdeep Parhar /*
44267951040fSNavdeep Parhar  * len16 for a txpkts type 1 WR with a GL.  Does not include the firmware work
44277951040fSNavdeep Parhar  * request header.
44287951040fSNavdeep Parhar  */
44297951040fSNavdeep Parhar static inline u_int
44307951040fSNavdeep Parhar txpkts1_len16(void)
44317951040fSNavdeep Parhar {
44327951040fSNavdeep Parhar 	u_int n;
44337951040fSNavdeep Parhar 
44347951040fSNavdeep Parhar 	n = sizeof(struct cpl_tx_pkt_core) + sizeof(struct ulptx_sgl);
44357951040fSNavdeep Parhar 
44367951040fSNavdeep Parhar 	return (howmany(n, 16));
44377951040fSNavdeep Parhar }
44387951040fSNavdeep Parhar 
44397951040fSNavdeep Parhar static inline u_int
44407951040fSNavdeep Parhar imm_payload(u_int ndesc)
44417951040fSNavdeep Parhar {
44427951040fSNavdeep Parhar 	u_int n;
44437951040fSNavdeep Parhar 
44447951040fSNavdeep Parhar 	n = ndesc * EQ_ESIZE - sizeof(struct fw_eth_tx_pkt_wr) -
44457951040fSNavdeep Parhar 	    sizeof(struct cpl_tx_pkt_core);
44467951040fSNavdeep Parhar 
44477951040fSNavdeep Parhar 	return (n);
44487951040fSNavdeep Parhar }
44497951040fSNavdeep Parhar 
44507951040fSNavdeep Parhar /*
44516af45170SJohn Baldwin  * Write a VM txpkt WR for this packet to the hardware descriptors, update the
44526af45170SJohn Baldwin  * software descriptor, and advance the pidx.  It is guaranteed that enough
44536af45170SJohn Baldwin  * descriptors are available.
44546af45170SJohn Baldwin  *
44556af45170SJohn Baldwin  * The return value is the # of hardware descriptors used.
44566af45170SJohn Baldwin  */
44576af45170SJohn Baldwin static u_int
4458472a6004SNavdeep Parhar write_txpkt_vm_wr(struct adapter *sc, struct sge_txq *txq,
4459472a6004SNavdeep Parhar     struct fw_eth_tx_pkt_vm_wr *wr, struct mbuf *m0, u_int available)
44606af45170SJohn Baldwin {
44616af45170SJohn Baldwin 	struct sge_eq *eq = &txq->eq;
44626af45170SJohn Baldwin 	struct tx_sdesc *txsd;
44636af45170SJohn Baldwin 	struct cpl_tx_pkt_core *cpl;
44646af45170SJohn Baldwin 	uint32_t ctrl;	/* used in many unrelated places */
44656af45170SJohn Baldwin 	uint64_t ctrl1;
44666af45170SJohn Baldwin 	int csum_type, len16, ndesc, pktlen, nsegs;
44676af45170SJohn Baldwin 	caddr_t dst;
44686af45170SJohn Baldwin 
44696af45170SJohn Baldwin 	TXQ_LOCK_ASSERT_OWNED(txq);
44706af45170SJohn Baldwin 	M_ASSERTPKTHDR(m0);
44716af45170SJohn Baldwin 	MPASS(available > 0 && available < eq->sidx);
44726af45170SJohn Baldwin 
44736af45170SJohn Baldwin 	len16 = mbuf_len16(m0);
44746af45170SJohn Baldwin 	nsegs = mbuf_nsegs(m0);
44756af45170SJohn Baldwin 	pktlen = m0->m_pkthdr.len;
44766af45170SJohn Baldwin 	ctrl = sizeof(struct cpl_tx_pkt_core);
44776af45170SJohn Baldwin 	if (needs_tso(m0))
44786af45170SJohn Baldwin 		ctrl += sizeof(struct cpl_tx_pkt_lso_core);
44796af45170SJohn Baldwin 	ndesc = howmany(len16, EQ_ESIZE / 16);
44806af45170SJohn Baldwin 	MPASS(ndesc <= available);
44816af45170SJohn Baldwin 
44826af45170SJohn Baldwin 	/* Firmware work request header */
44836af45170SJohn Baldwin 	MPASS(wr == (void *)&eq->desc[eq->pidx]);
44846af45170SJohn Baldwin 	wr->op_immdlen = htobe32(V_FW_WR_OP(FW_ETH_TX_PKT_VM_WR) |
44856af45170SJohn Baldwin 	    V_FW_ETH_TX_PKT_WR_IMMDLEN(ctrl));
44866af45170SJohn Baldwin 
44876af45170SJohn Baldwin 	ctrl = V_FW_WR_LEN16(len16);
44886af45170SJohn Baldwin 	wr->equiq_to_len16 = htobe32(ctrl);
44896af45170SJohn Baldwin 	wr->r3[0] = 0;
44906af45170SJohn Baldwin 	wr->r3[1] = 0;
44916af45170SJohn Baldwin 
44926af45170SJohn Baldwin 	/*
44936af45170SJohn Baldwin 	 * Copy over ethmacdst, ethmacsrc, ethtype, and vlantci.
44946af45170SJohn Baldwin 	 * vlantci is ignored unless the ethtype is 0x8100, so it's
44956af45170SJohn Baldwin 	 * simpler to always copy it rather than making it
44966af45170SJohn Baldwin 	 * conditional.  Also, it seems that we do not have to set
44976af45170SJohn Baldwin 	 * vlantci or fake the ethtype when doing VLAN tag insertion.
44986af45170SJohn Baldwin 	 */
44996af45170SJohn Baldwin 	m_copydata(m0, 0, sizeof(struct ether_header) + 2, wr->ethmacdst);
45006af45170SJohn Baldwin 
45016af45170SJohn Baldwin 	csum_type = -1;
45026af45170SJohn Baldwin 	if (needs_tso(m0)) {
45036af45170SJohn Baldwin 		struct cpl_tx_pkt_lso_core *lso = (void *)(wr + 1);
45046af45170SJohn Baldwin 
45056af45170SJohn Baldwin 		KASSERT(m0->m_pkthdr.l2hlen > 0 && m0->m_pkthdr.l3hlen > 0 &&
45066af45170SJohn Baldwin 		    m0->m_pkthdr.l4hlen > 0,
45076af45170SJohn Baldwin 		    ("%s: mbuf %p needs TSO but missing header lengths",
45086af45170SJohn Baldwin 			__func__, m0));
45096af45170SJohn Baldwin 
45106af45170SJohn Baldwin 		ctrl = V_LSO_OPCODE(CPL_TX_PKT_LSO) | F_LSO_FIRST_SLICE |
45116af45170SJohn Baldwin 		    F_LSO_LAST_SLICE | V_LSO_IPHDR_LEN(m0->m_pkthdr.l3hlen >> 2)
45126af45170SJohn Baldwin 		    | V_LSO_TCPHDR_LEN(m0->m_pkthdr.l4hlen >> 2);
45136af45170SJohn Baldwin 		if (m0->m_pkthdr.l2hlen == sizeof(struct ether_vlan_header))
45146af45170SJohn Baldwin 			ctrl |= V_LSO_ETHHDR_LEN(1);
45156af45170SJohn Baldwin 		if (m0->m_pkthdr.l3hlen == sizeof(struct ip6_hdr))
45166af45170SJohn Baldwin 			ctrl |= F_LSO_IPV6;
45176af45170SJohn Baldwin 
45186af45170SJohn Baldwin 		lso->lso_ctrl = htobe32(ctrl);
45196af45170SJohn Baldwin 		lso->ipid_ofst = htobe16(0);
45206af45170SJohn Baldwin 		lso->mss = htobe16(m0->m_pkthdr.tso_segsz);
45216af45170SJohn Baldwin 		lso->seqno_offset = htobe32(0);
45226af45170SJohn Baldwin 		lso->len = htobe32(pktlen);
45236af45170SJohn Baldwin 
45246af45170SJohn Baldwin 		if (m0->m_pkthdr.l3hlen == sizeof(struct ip6_hdr))
45256af45170SJohn Baldwin 			csum_type = TX_CSUM_TCPIP6;
45266af45170SJohn Baldwin 		else
45276af45170SJohn Baldwin 			csum_type = TX_CSUM_TCPIP;
45286af45170SJohn Baldwin 
45296af45170SJohn Baldwin 		cpl = (void *)(lso + 1);
45306af45170SJohn Baldwin 
45316af45170SJohn Baldwin 		txq->tso_wrs++;
45326af45170SJohn Baldwin 	} else {
45336af45170SJohn Baldwin 		if (m0->m_pkthdr.csum_flags & CSUM_IP_TCP)
45346af45170SJohn Baldwin 			csum_type = TX_CSUM_TCPIP;
45356af45170SJohn Baldwin 		else if (m0->m_pkthdr.csum_flags & CSUM_IP_UDP)
45366af45170SJohn Baldwin 			csum_type = TX_CSUM_UDPIP;
45376af45170SJohn Baldwin 		else if (m0->m_pkthdr.csum_flags & CSUM_IP6_TCP)
45386af45170SJohn Baldwin 			csum_type = TX_CSUM_TCPIP6;
45396af45170SJohn Baldwin 		else if (m0->m_pkthdr.csum_flags & CSUM_IP6_UDP)
45406af45170SJohn Baldwin 			csum_type = TX_CSUM_UDPIP6;
45416af45170SJohn Baldwin #if defined(INET)
45426af45170SJohn Baldwin 		else if (m0->m_pkthdr.csum_flags & CSUM_IP) {
45436af45170SJohn Baldwin 			/*
45446af45170SJohn Baldwin 			 * XXX: The firmware appears to stomp on the
45456af45170SJohn Baldwin 			 * fragment/flags field of the IP header when
45466af45170SJohn Baldwin 			 * using TX_CSUM_IP.  Fall back to doing
45476af45170SJohn Baldwin 			 * software checksums.
45486af45170SJohn Baldwin 			 */
45496af45170SJohn Baldwin 			u_short *sump;
45506af45170SJohn Baldwin 			struct mbuf *m;
45516af45170SJohn Baldwin 			int offset;
45526af45170SJohn Baldwin 
45536af45170SJohn Baldwin 			m = m0;
45546af45170SJohn Baldwin 			offset = 0;
45556af45170SJohn Baldwin 			sump = m_advance(&m, &offset, m0->m_pkthdr.l2hlen +
45566af45170SJohn Baldwin 			    offsetof(struct ip, ip_sum));
45576af45170SJohn Baldwin 			*sump = in_cksum_skip(m0, m0->m_pkthdr.l2hlen +
45586af45170SJohn Baldwin 			    m0->m_pkthdr.l3hlen, m0->m_pkthdr.l2hlen);
45596af45170SJohn Baldwin 			m0->m_pkthdr.csum_flags &= ~CSUM_IP;
45606af45170SJohn Baldwin 		}
45616af45170SJohn Baldwin #endif
45626af45170SJohn Baldwin 
45636af45170SJohn Baldwin 		cpl = (void *)(wr + 1);
45646af45170SJohn Baldwin 	}
45656af45170SJohn Baldwin 
45666af45170SJohn Baldwin 	/* Checksum offload */
45676af45170SJohn Baldwin 	ctrl1 = 0;
45686af45170SJohn Baldwin 	if (needs_l3_csum(m0) == 0)
45696af45170SJohn Baldwin 		ctrl1 |= F_TXPKT_IPCSUM_DIS;
45706af45170SJohn Baldwin 	if (csum_type >= 0) {
45716af45170SJohn Baldwin 		KASSERT(m0->m_pkthdr.l2hlen > 0 && m0->m_pkthdr.l3hlen > 0,
45726af45170SJohn Baldwin 	    ("%s: mbuf %p needs checksum offload but missing header lengths",
45736af45170SJohn Baldwin 			__func__, m0));
45746af45170SJohn Baldwin 
4575472a6004SNavdeep Parhar 		if (chip_id(sc) <= CHELSIO_T5) {
45766af45170SJohn Baldwin 			ctrl1 |= V_TXPKT_ETHHDR_LEN(m0->m_pkthdr.l2hlen -
45776af45170SJohn Baldwin 			    ETHER_HDR_LEN);
4578472a6004SNavdeep Parhar 		} else {
4579472a6004SNavdeep Parhar 			ctrl1 |= V_T6_TXPKT_ETHHDR_LEN(m0->m_pkthdr.l2hlen -
4580472a6004SNavdeep Parhar 			    ETHER_HDR_LEN);
4581472a6004SNavdeep Parhar 		}
45826af45170SJohn Baldwin 		ctrl1 |= V_TXPKT_IPHDR_LEN(m0->m_pkthdr.l3hlen);
45836af45170SJohn Baldwin 		ctrl1 |= V_TXPKT_CSUM_TYPE(csum_type);
45846af45170SJohn Baldwin 	} else
45856af45170SJohn Baldwin 		ctrl1 |= F_TXPKT_L4CSUM_DIS;
45866af45170SJohn Baldwin 	if (m0->m_pkthdr.csum_flags & (CSUM_IP | CSUM_TCP | CSUM_UDP |
45876af45170SJohn Baldwin 	    CSUM_UDP_IPV6 | CSUM_TCP_IPV6 | CSUM_TSO))
45886af45170SJohn Baldwin 		txq->txcsum++;	/* some hardware assistance provided */
45896af45170SJohn Baldwin 
45906af45170SJohn Baldwin 	/* VLAN tag insertion */
45916af45170SJohn Baldwin 	if (needs_vlan_insertion(m0)) {
45926af45170SJohn Baldwin 		ctrl1 |= F_TXPKT_VLAN_VLD |
45936af45170SJohn Baldwin 		    V_TXPKT_VLAN(m0->m_pkthdr.ether_vtag);
45946af45170SJohn Baldwin 		txq->vlan_insertion++;
45956af45170SJohn Baldwin 	}
45966af45170SJohn Baldwin 
45976af45170SJohn Baldwin 	/* CPL header */
45986af45170SJohn Baldwin 	cpl->ctrl0 = txq->cpl_ctrl0;
45996af45170SJohn Baldwin 	cpl->pack = 0;
46006af45170SJohn Baldwin 	cpl->len = htobe16(pktlen);
46016af45170SJohn Baldwin 	cpl->ctrl1 = htobe64(ctrl1);
46026af45170SJohn Baldwin 
46036af45170SJohn Baldwin 	/* SGL */
46046af45170SJohn Baldwin 	dst = (void *)(cpl + 1);
46056af45170SJohn Baldwin 
46066af45170SJohn Baldwin 	/*
46076af45170SJohn Baldwin 	 * A packet using TSO will use up an entire descriptor for the
46086af45170SJohn Baldwin 	 * firmware work request header, LSO CPL, and TX_PKT_XT CPL.
46096af45170SJohn Baldwin 	 * If this descriptor is the last descriptor in the ring, wrap
46106af45170SJohn Baldwin 	 * around to the front of the ring explicitly for the start of
46116af45170SJohn Baldwin 	 * the sgl.
46126af45170SJohn Baldwin 	 */
46136af45170SJohn Baldwin 	if (dst == (void *)&eq->desc[eq->sidx]) {
46146af45170SJohn Baldwin 		dst = (void *)&eq->desc[0];
46156af45170SJohn Baldwin 		write_gl_to_txd(txq, m0, &dst, 0);
46166af45170SJohn Baldwin 	} else
46176af45170SJohn Baldwin 		write_gl_to_txd(txq, m0, &dst, eq->sidx - ndesc < eq->pidx);
46186af45170SJohn Baldwin 	txq->sgl_wrs++;
46196af45170SJohn Baldwin 
46206af45170SJohn Baldwin 	txq->txpkt_wrs++;
46216af45170SJohn Baldwin 
46226af45170SJohn Baldwin 	txsd = &txq->sdesc[eq->pidx];
46236af45170SJohn Baldwin 	txsd->m = m0;
46246af45170SJohn Baldwin 	txsd->desc_used = ndesc;
46256af45170SJohn Baldwin 
46266af45170SJohn Baldwin 	return (ndesc);
46276af45170SJohn Baldwin }
46286af45170SJohn Baldwin 
46296af45170SJohn Baldwin /*
4630*5cdaef71SJohn Baldwin  * Write a raw WR to the hardware descriptors, update the software
4631*5cdaef71SJohn Baldwin  * descriptor, and advance the pidx.  It is guaranteed that enough
4632*5cdaef71SJohn Baldwin  * descriptors are available.
4633*5cdaef71SJohn Baldwin  *
4634*5cdaef71SJohn Baldwin  * The return value is the # of hardware descriptors used.
4635*5cdaef71SJohn Baldwin  */
4636*5cdaef71SJohn Baldwin static u_int
4637*5cdaef71SJohn Baldwin write_raw_wr(struct sge_txq *txq, void *wr, struct mbuf *m0, u_int available)
4638*5cdaef71SJohn Baldwin {
4639*5cdaef71SJohn Baldwin 	struct sge_eq *eq = &txq->eq;
4640*5cdaef71SJohn Baldwin 	struct tx_sdesc *txsd;
4641*5cdaef71SJohn Baldwin 	struct mbuf *m;
4642*5cdaef71SJohn Baldwin 	caddr_t dst;
4643*5cdaef71SJohn Baldwin 	int len16, ndesc;
4644*5cdaef71SJohn Baldwin 
4645*5cdaef71SJohn Baldwin 	len16 = mbuf_len16(m0);
4646*5cdaef71SJohn Baldwin 	ndesc = howmany(len16, EQ_ESIZE / 16);
4647*5cdaef71SJohn Baldwin 	MPASS(ndesc <= available);
4648*5cdaef71SJohn Baldwin 
4649*5cdaef71SJohn Baldwin 	dst = wr;
4650*5cdaef71SJohn Baldwin 	for (m = m0; m != NULL; m = m->m_next)
4651*5cdaef71SJohn Baldwin 		copy_to_txd(eq, mtod(m, caddr_t), &dst, m->m_len);
4652*5cdaef71SJohn Baldwin 
4653*5cdaef71SJohn Baldwin 	txq->raw_wrs++;
4654*5cdaef71SJohn Baldwin 
4655*5cdaef71SJohn Baldwin 	txsd = &txq->sdesc[eq->pidx];
4656*5cdaef71SJohn Baldwin 	txsd->m = m0;
4657*5cdaef71SJohn Baldwin 	txsd->desc_used = ndesc;
4658*5cdaef71SJohn Baldwin 
4659*5cdaef71SJohn Baldwin 	return (ndesc);
4660*5cdaef71SJohn Baldwin }
4661*5cdaef71SJohn Baldwin 
4662*5cdaef71SJohn Baldwin /*
46637951040fSNavdeep Parhar  * Write a txpkt WR for this packet to the hardware descriptors, update the
46647951040fSNavdeep Parhar  * software descriptor, and advance the pidx.  It is guaranteed that enough
46657951040fSNavdeep Parhar  * descriptors are available.
466654e4ee71SNavdeep Parhar  *
46677951040fSNavdeep Parhar  * The return value is the # of hardware descriptors used.
466854e4ee71SNavdeep Parhar  */
46697951040fSNavdeep Parhar static u_int
46707951040fSNavdeep Parhar write_txpkt_wr(struct sge_txq *txq, struct fw_eth_tx_pkt_wr *wr,
46717951040fSNavdeep Parhar     struct mbuf *m0, u_int available)
467254e4ee71SNavdeep Parhar {
467354e4ee71SNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
46747951040fSNavdeep Parhar 	struct tx_sdesc *txsd;
467554e4ee71SNavdeep Parhar 	struct cpl_tx_pkt_core *cpl;
467654e4ee71SNavdeep Parhar 	uint32_t ctrl;	/* used in many unrelated places */
467754e4ee71SNavdeep Parhar 	uint64_t ctrl1;
46787951040fSNavdeep Parhar 	int len16, ndesc, pktlen, nsegs;
467954e4ee71SNavdeep Parhar 	caddr_t dst;
468054e4ee71SNavdeep Parhar 
468154e4ee71SNavdeep Parhar 	TXQ_LOCK_ASSERT_OWNED(txq);
46827951040fSNavdeep Parhar 	M_ASSERTPKTHDR(m0);
46837951040fSNavdeep Parhar 	MPASS(available > 0 && available < eq->sidx);
468454e4ee71SNavdeep Parhar 
46857951040fSNavdeep Parhar 	len16 = mbuf_len16(m0);
46867951040fSNavdeep Parhar 	nsegs = mbuf_nsegs(m0);
46877951040fSNavdeep Parhar 	pktlen = m0->m_pkthdr.len;
468854e4ee71SNavdeep Parhar 	ctrl = sizeof(struct cpl_tx_pkt_core);
46897951040fSNavdeep Parhar 	if (needs_tso(m0))
46902a5f6b0eSNavdeep Parhar 		ctrl += sizeof(struct cpl_tx_pkt_lso_core);
46917951040fSNavdeep Parhar 	else if (pktlen <= imm_payload(2) && available >= 2) {
46927951040fSNavdeep Parhar 		/* Immediate data.  Recalculate len16 and set nsegs to 0. */
4693ecb79ca4SNavdeep Parhar 		ctrl += pktlen;
46947951040fSNavdeep Parhar 		len16 = howmany(sizeof(struct fw_eth_tx_pkt_wr) +
46957951040fSNavdeep Parhar 		    sizeof(struct cpl_tx_pkt_core) + pktlen, 16);
46967951040fSNavdeep Parhar 		nsegs = 0;
469754e4ee71SNavdeep Parhar 	}
46987951040fSNavdeep Parhar 	ndesc = howmany(len16, EQ_ESIZE / 16);
46997951040fSNavdeep Parhar 	MPASS(ndesc <= available);
470054e4ee71SNavdeep Parhar 
470154e4ee71SNavdeep Parhar 	/* Firmware work request header */
47027951040fSNavdeep Parhar 	MPASS(wr == (void *)&eq->desc[eq->pidx]);
470354e4ee71SNavdeep Parhar 	wr->op_immdlen = htobe32(V_FW_WR_OP(FW_ETH_TX_PKT_WR) |
4704733b9277SNavdeep Parhar 	    V_FW_ETH_TX_PKT_WR_IMMDLEN(ctrl));
47056b49a4ecSNavdeep Parhar 
47067951040fSNavdeep Parhar 	ctrl = V_FW_WR_LEN16(len16);
470754e4ee71SNavdeep Parhar 	wr->equiq_to_len16 = htobe32(ctrl);
470854e4ee71SNavdeep Parhar 	wr->r3 = 0;
470954e4ee71SNavdeep Parhar 
47107951040fSNavdeep Parhar 	if (needs_tso(m0)) {
47112a5f6b0eSNavdeep Parhar 		struct cpl_tx_pkt_lso_core *lso = (void *)(wr + 1);
47127951040fSNavdeep Parhar 
47137951040fSNavdeep Parhar 		KASSERT(m0->m_pkthdr.l2hlen > 0 && m0->m_pkthdr.l3hlen > 0 &&
47147951040fSNavdeep Parhar 		    m0->m_pkthdr.l4hlen > 0,
47157951040fSNavdeep Parhar 		    ("%s: mbuf %p needs TSO but missing header lengths",
47167951040fSNavdeep Parhar 			__func__, m0));
471754e4ee71SNavdeep Parhar 
471854e4ee71SNavdeep Parhar 		ctrl = V_LSO_OPCODE(CPL_TX_PKT_LSO) | F_LSO_FIRST_SLICE |
47197951040fSNavdeep Parhar 		    F_LSO_LAST_SLICE | V_LSO_IPHDR_LEN(m0->m_pkthdr.l3hlen >> 2)
47207951040fSNavdeep Parhar 		    | V_LSO_TCPHDR_LEN(m0->m_pkthdr.l4hlen >> 2);
47217951040fSNavdeep Parhar 		if (m0->m_pkthdr.l2hlen == sizeof(struct ether_vlan_header))
472254e4ee71SNavdeep Parhar 			ctrl |= V_LSO_ETHHDR_LEN(1);
47237951040fSNavdeep Parhar 		if (m0->m_pkthdr.l3hlen == sizeof(struct ip6_hdr))
4724a1ea9a82SNavdeep Parhar 			ctrl |= F_LSO_IPV6;
472554e4ee71SNavdeep Parhar 
472654e4ee71SNavdeep Parhar 		lso->lso_ctrl = htobe32(ctrl);
472754e4ee71SNavdeep Parhar 		lso->ipid_ofst = htobe16(0);
47287951040fSNavdeep Parhar 		lso->mss = htobe16(m0->m_pkthdr.tso_segsz);
472954e4ee71SNavdeep Parhar 		lso->seqno_offset = htobe32(0);
4730ecb79ca4SNavdeep Parhar 		lso->len = htobe32(pktlen);
473154e4ee71SNavdeep Parhar 
473254e4ee71SNavdeep Parhar 		cpl = (void *)(lso + 1);
473354e4ee71SNavdeep Parhar 
473454e4ee71SNavdeep Parhar 		txq->tso_wrs++;
473554e4ee71SNavdeep Parhar 	} else
473654e4ee71SNavdeep Parhar 		cpl = (void *)(wr + 1);
473754e4ee71SNavdeep Parhar 
473854e4ee71SNavdeep Parhar 	/* Checksum offload */
473954e4ee71SNavdeep Parhar 	ctrl1 = 0;
47407951040fSNavdeep Parhar 	if (needs_l3_csum(m0) == 0)
474154e4ee71SNavdeep Parhar 		ctrl1 |= F_TXPKT_IPCSUM_DIS;
47427951040fSNavdeep Parhar 	if (needs_l4_csum(m0) == 0)
474354e4ee71SNavdeep Parhar 		ctrl1 |= F_TXPKT_L4CSUM_DIS;
47447951040fSNavdeep Parhar 	if (m0->m_pkthdr.csum_flags & (CSUM_IP | CSUM_TCP | CSUM_UDP |
4745b8531380SNavdeep Parhar 	    CSUM_UDP_IPV6 | CSUM_TCP_IPV6 | CSUM_TSO))
474654e4ee71SNavdeep Parhar 		txq->txcsum++;	/* some hardware assistance provided */
474754e4ee71SNavdeep Parhar 
474854e4ee71SNavdeep Parhar 	/* VLAN tag insertion */
47497951040fSNavdeep Parhar 	if (needs_vlan_insertion(m0)) {
47507951040fSNavdeep Parhar 		ctrl1 |= F_TXPKT_VLAN_VLD | V_TXPKT_VLAN(m0->m_pkthdr.ether_vtag);
475154e4ee71SNavdeep Parhar 		txq->vlan_insertion++;
475254e4ee71SNavdeep Parhar 	}
475354e4ee71SNavdeep Parhar 
475454e4ee71SNavdeep Parhar 	/* CPL header */
47557951040fSNavdeep Parhar 	cpl->ctrl0 = txq->cpl_ctrl0;
475654e4ee71SNavdeep Parhar 	cpl->pack = 0;
4757ecb79ca4SNavdeep Parhar 	cpl->len = htobe16(pktlen);
475854e4ee71SNavdeep Parhar 	cpl->ctrl1 = htobe64(ctrl1);
475954e4ee71SNavdeep Parhar 
476054e4ee71SNavdeep Parhar 	/* SGL */
476154e4ee71SNavdeep Parhar 	dst = (void *)(cpl + 1);
47627951040fSNavdeep Parhar 	if (nsegs > 0) {
47637951040fSNavdeep Parhar 
47647951040fSNavdeep Parhar 		write_gl_to_txd(txq, m0, &dst, eq->sidx - ndesc < eq->pidx);
476554e4ee71SNavdeep Parhar 		txq->sgl_wrs++;
476654e4ee71SNavdeep Parhar 	} else {
47677951040fSNavdeep Parhar 		struct mbuf *m;
47687951040fSNavdeep Parhar 
47697951040fSNavdeep Parhar 		for (m = m0; m != NULL; m = m->m_next) {
477054e4ee71SNavdeep Parhar 			copy_to_txd(eq, mtod(m, caddr_t), &dst, m->m_len);
4771ecb79ca4SNavdeep Parhar #ifdef INVARIANTS
4772ecb79ca4SNavdeep Parhar 			pktlen -= m->m_len;
4773ecb79ca4SNavdeep Parhar #endif
477454e4ee71SNavdeep Parhar 		}
4775ecb79ca4SNavdeep Parhar #ifdef INVARIANTS
4776ecb79ca4SNavdeep Parhar 		KASSERT(pktlen == 0, ("%s: %d bytes left.", __func__, pktlen));
4777ecb79ca4SNavdeep Parhar #endif
47787951040fSNavdeep Parhar 		txq->imm_wrs++;
477954e4ee71SNavdeep Parhar 	}
478054e4ee71SNavdeep Parhar 
478154e4ee71SNavdeep Parhar 	txq->txpkt_wrs++;
478254e4ee71SNavdeep Parhar 
4783f7dfe243SNavdeep Parhar 	txsd = &txq->sdesc[eq->pidx];
47847951040fSNavdeep Parhar 	txsd->m = m0;
478554e4ee71SNavdeep Parhar 	txsd->desc_used = ndesc;
478654e4ee71SNavdeep Parhar 
47877951040fSNavdeep Parhar 	return (ndesc);
478854e4ee71SNavdeep Parhar }
478954e4ee71SNavdeep Parhar 
47907951040fSNavdeep Parhar static int
47917951040fSNavdeep Parhar try_txpkts(struct mbuf *m, struct mbuf *n, struct txpkts *txp, u_int available)
479254e4ee71SNavdeep Parhar {
47937951040fSNavdeep Parhar 	u_int needed, nsegs1, nsegs2, l1, l2;
47947951040fSNavdeep Parhar 
47957951040fSNavdeep Parhar 	if (cannot_use_txpkts(m) || cannot_use_txpkts(n))
47967951040fSNavdeep Parhar 		return (1);
47977951040fSNavdeep Parhar 
47987951040fSNavdeep Parhar 	nsegs1 = mbuf_nsegs(m);
47997951040fSNavdeep Parhar 	nsegs2 = mbuf_nsegs(n);
48007951040fSNavdeep Parhar 	if (nsegs1 + nsegs2 == 2) {
48017951040fSNavdeep Parhar 		txp->wr_type = 1;
48027951040fSNavdeep Parhar 		l1 = l2 = txpkts1_len16();
48037951040fSNavdeep Parhar 	} else {
48047951040fSNavdeep Parhar 		txp->wr_type = 0;
48057951040fSNavdeep Parhar 		l1 = txpkts0_len16(nsegs1);
48067951040fSNavdeep Parhar 		l2 = txpkts0_len16(nsegs2);
48077951040fSNavdeep Parhar 	}
48087951040fSNavdeep Parhar 	txp->len16 = howmany(sizeof(struct fw_eth_tx_pkts_wr), 16) + l1 + l2;
48097951040fSNavdeep Parhar 	needed = howmany(txp->len16, EQ_ESIZE / 16);
48107951040fSNavdeep Parhar 	if (needed > SGE_MAX_WR_NDESC || needed > available)
48117951040fSNavdeep Parhar 		return (1);
48127951040fSNavdeep Parhar 
48137951040fSNavdeep Parhar 	txp->plen = m->m_pkthdr.len + n->m_pkthdr.len;
48147951040fSNavdeep Parhar 	if (txp->plen > 65535)
48157951040fSNavdeep Parhar 		return (1);
48167951040fSNavdeep Parhar 
48177951040fSNavdeep Parhar 	txp->npkt = 2;
48187951040fSNavdeep Parhar 	set_mbuf_len16(m, l1);
48197951040fSNavdeep Parhar 	set_mbuf_len16(n, l2);
48207951040fSNavdeep Parhar 
48217951040fSNavdeep Parhar 	return (0);
48227951040fSNavdeep Parhar }
48237951040fSNavdeep Parhar 
48247951040fSNavdeep Parhar static int
48257951040fSNavdeep Parhar add_to_txpkts(struct mbuf *m, struct txpkts *txp, u_int available)
48267951040fSNavdeep Parhar {
48277951040fSNavdeep Parhar 	u_int plen, len16, needed, nsegs;
48287951040fSNavdeep Parhar 
48297951040fSNavdeep Parhar 	MPASS(txp->wr_type == 0 || txp->wr_type == 1);
48307951040fSNavdeep Parhar 
48317890b5c1SJohn Baldwin 	if (cannot_use_txpkts(m))
48327890b5c1SJohn Baldwin 		return (1);
48337890b5c1SJohn Baldwin 
48347951040fSNavdeep Parhar 	nsegs = mbuf_nsegs(m);
48357890b5c1SJohn Baldwin 	if (txp->wr_type == 1 && nsegs != 1)
48367951040fSNavdeep Parhar 		return (1);
48377951040fSNavdeep Parhar 
48387951040fSNavdeep Parhar 	plen = txp->plen + m->m_pkthdr.len;
48397951040fSNavdeep Parhar 	if (plen > 65535)
48407951040fSNavdeep Parhar 		return (1);
48417951040fSNavdeep Parhar 
48427951040fSNavdeep Parhar 	if (txp->wr_type == 0)
48437951040fSNavdeep Parhar 		len16 = txpkts0_len16(nsegs);
48447951040fSNavdeep Parhar 	else
48457951040fSNavdeep Parhar 		len16 = txpkts1_len16();
48467951040fSNavdeep Parhar 	needed = howmany(txp->len16 + len16, EQ_ESIZE / 16);
48477951040fSNavdeep Parhar 	if (needed > SGE_MAX_WR_NDESC || needed > available)
48487951040fSNavdeep Parhar 		return (1);
48497951040fSNavdeep Parhar 
48507951040fSNavdeep Parhar 	txp->npkt++;
48517951040fSNavdeep Parhar 	txp->plen = plen;
48527951040fSNavdeep Parhar 	txp->len16 += len16;
48537951040fSNavdeep Parhar 	set_mbuf_len16(m, len16);
48547951040fSNavdeep Parhar 
48557951040fSNavdeep Parhar 	return (0);
48567951040fSNavdeep Parhar }
48577951040fSNavdeep Parhar 
48587951040fSNavdeep Parhar /*
48597951040fSNavdeep Parhar  * Write a txpkts WR for the packets in txp to the hardware descriptors, update
48607951040fSNavdeep Parhar  * the software descriptor, and advance the pidx.  It is guaranteed that enough
48617951040fSNavdeep Parhar  * descriptors are available.
48627951040fSNavdeep Parhar  *
48637951040fSNavdeep Parhar  * The return value is the # of hardware descriptors used.
48647951040fSNavdeep Parhar  */
48657951040fSNavdeep Parhar static u_int
48667951040fSNavdeep Parhar write_txpkts_wr(struct sge_txq *txq, struct fw_eth_tx_pkts_wr *wr,
48677951040fSNavdeep Parhar     struct mbuf *m0, const struct txpkts *txp, u_int available)
48687951040fSNavdeep Parhar {
48697951040fSNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
48707951040fSNavdeep Parhar 	struct tx_sdesc *txsd;
48717951040fSNavdeep Parhar 	struct cpl_tx_pkt_core *cpl;
48727951040fSNavdeep Parhar 	uint32_t ctrl;
48737951040fSNavdeep Parhar 	uint64_t ctrl1;
48747951040fSNavdeep Parhar 	int ndesc, checkwrap;
48757951040fSNavdeep Parhar 	struct mbuf *m;
48767951040fSNavdeep Parhar 	void *flitp;
48777951040fSNavdeep Parhar 
48787951040fSNavdeep Parhar 	TXQ_LOCK_ASSERT_OWNED(txq);
48797951040fSNavdeep Parhar 	MPASS(txp->npkt > 0);
48807951040fSNavdeep Parhar 	MPASS(txp->plen < 65536);
48817951040fSNavdeep Parhar 	MPASS(m0 != NULL);
48827951040fSNavdeep Parhar 	MPASS(m0->m_nextpkt != NULL);
48837951040fSNavdeep Parhar 	MPASS(txp->len16 <= howmany(SGE_MAX_WR_LEN, 16));
48847951040fSNavdeep Parhar 	MPASS(available > 0 && available < eq->sidx);
48857951040fSNavdeep Parhar 
48867951040fSNavdeep Parhar 	ndesc = howmany(txp->len16, EQ_ESIZE / 16);
48877951040fSNavdeep Parhar 	MPASS(ndesc <= available);
48887951040fSNavdeep Parhar 
48897951040fSNavdeep Parhar 	MPASS(wr == (void *)&eq->desc[eq->pidx]);
48907951040fSNavdeep Parhar 	wr->op_pkd = htobe32(V_FW_WR_OP(FW_ETH_TX_PKTS_WR));
48917951040fSNavdeep Parhar 	ctrl = V_FW_WR_LEN16(txp->len16);
48927951040fSNavdeep Parhar 	wr->equiq_to_len16 = htobe32(ctrl);
48937951040fSNavdeep Parhar 	wr->plen = htobe16(txp->plen);
48947951040fSNavdeep Parhar 	wr->npkt = txp->npkt;
48957951040fSNavdeep Parhar 	wr->r3 = 0;
48967951040fSNavdeep Parhar 	wr->type = txp->wr_type;
48977951040fSNavdeep Parhar 	flitp = wr + 1;
48987951040fSNavdeep Parhar 
48997951040fSNavdeep Parhar 	/*
49007951040fSNavdeep Parhar 	 * At this point we are 16B into a hardware descriptor.  If checkwrap is
49017951040fSNavdeep Parhar 	 * set then we know the WR is going to wrap around somewhere.  We'll
49027951040fSNavdeep Parhar 	 * check for that at appropriate points.
49037951040fSNavdeep Parhar 	 */
49047951040fSNavdeep Parhar 	checkwrap = eq->sidx - ndesc < eq->pidx;
49057951040fSNavdeep Parhar 	for (m = m0; m != NULL; m = m->m_nextpkt) {
49067951040fSNavdeep Parhar 		if (txp->wr_type == 0) {
490754e4ee71SNavdeep Parhar 			struct ulp_txpkt *ulpmc;
490854e4ee71SNavdeep Parhar 			struct ulptx_idata *ulpsc;
490954e4ee71SNavdeep Parhar 
49107951040fSNavdeep Parhar 			/* ULP master command */
49117951040fSNavdeep Parhar 			ulpmc = flitp;
49127951040fSNavdeep Parhar 			ulpmc->cmd_dest = htobe32(V_ULPTX_CMD(ULP_TX_PKT) |
49137951040fSNavdeep Parhar 			    V_ULP_TXPKT_DEST(0) | V_ULP_TXPKT_FID(eq->iqid));
49147951040fSNavdeep Parhar 			ulpmc->len = htobe32(mbuf_len16(m));
491554e4ee71SNavdeep Parhar 
49167951040fSNavdeep Parhar 			/* ULP subcommand */
49177951040fSNavdeep Parhar 			ulpsc = (void *)(ulpmc + 1);
49187951040fSNavdeep Parhar 			ulpsc->cmd_more = htobe32(V_ULPTX_CMD(ULP_TX_SC_IMM) |
49197951040fSNavdeep Parhar 			    F_ULP_TX_SC_MORE);
49207951040fSNavdeep Parhar 			ulpsc->len = htobe32(sizeof(struct cpl_tx_pkt_core));
49217951040fSNavdeep Parhar 
49227951040fSNavdeep Parhar 			cpl = (void *)(ulpsc + 1);
49237951040fSNavdeep Parhar 			if (checkwrap &&
49247951040fSNavdeep Parhar 			    (uintptr_t)cpl == (uintptr_t)&eq->desc[eq->sidx])
49257951040fSNavdeep Parhar 				cpl = (void *)&eq->desc[0];
49267951040fSNavdeep Parhar 		} else {
49277951040fSNavdeep Parhar 			cpl = flitp;
49287951040fSNavdeep Parhar 		}
492954e4ee71SNavdeep Parhar 
493054e4ee71SNavdeep Parhar 		/* Checksum offload */
49317951040fSNavdeep Parhar 		ctrl1 = 0;
49327951040fSNavdeep Parhar 		if (needs_l3_csum(m) == 0)
49337951040fSNavdeep Parhar 			ctrl1 |= F_TXPKT_IPCSUM_DIS;
49347951040fSNavdeep Parhar 		if (needs_l4_csum(m) == 0)
49357951040fSNavdeep Parhar 			ctrl1 |= F_TXPKT_L4CSUM_DIS;
4936b8531380SNavdeep Parhar 		if (m->m_pkthdr.csum_flags & (CSUM_IP | CSUM_TCP | CSUM_UDP |
4937b8531380SNavdeep Parhar 		    CSUM_UDP_IPV6 | CSUM_TCP_IPV6 | CSUM_TSO))
493854e4ee71SNavdeep Parhar 			txq->txcsum++;	/* some hardware assistance provided */
493954e4ee71SNavdeep Parhar 
494054e4ee71SNavdeep Parhar 		/* VLAN tag insertion */
49417951040fSNavdeep Parhar 		if (needs_vlan_insertion(m)) {
49427951040fSNavdeep Parhar 			ctrl1 |= F_TXPKT_VLAN_VLD |
49437951040fSNavdeep Parhar 			    V_TXPKT_VLAN(m->m_pkthdr.ether_vtag);
494454e4ee71SNavdeep Parhar 			txq->vlan_insertion++;
494554e4ee71SNavdeep Parhar 		}
494654e4ee71SNavdeep Parhar 
49477951040fSNavdeep Parhar 		/* CPL header */
49487951040fSNavdeep Parhar 		cpl->ctrl0 = txq->cpl_ctrl0;
494954e4ee71SNavdeep Parhar 		cpl->pack = 0;
495054e4ee71SNavdeep Parhar 		cpl->len = htobe16(m->m_pkthdr.len);
49517951040fSNavdeep Parhar 		cpl->ctrl1 = htobe64(ctrl1);
495254e4ee71SNavdeep Parhar 
49537951040fSNavdeep Parhar 		flitp = cpl + 1;
49547951040fSNavdeep Parhar 		if (checkwrap &&
49557951040fSNavdeep Parhar 		    (uintptr_t)flitp == (uintptr_t)&eq->desc[eq->sidx])
49567951040fSNavdeep Parhar 			flitp = (void *)&eq->desc[0];
495754e4ee71SNavdeep Parhar 
49587951040fSNavdeep Parhar 		write_gl_to_txd(txq, m, (caddr_t *)(&flitp), checkwrap);
495954e4ee71SNavdeep Parhar 
49607951040fSNavdeep Parhar 	}
49617951040fSNavdeep Parhar 
4962a59a1477SNavdeep Parhar 	if (txp->wr_type == 0) {
4963a59a1477SNavdeep Parhar 		txq->txpkts0_pkts += txp->npkt;
4964a59a1477SNavdeep Parhar 		txq->txpkts0_wrs++;
4965a59a1477SNavdeep Parhar 	} else {
4966a59a1477SNavdeep Parhar 		txq->txpkts1_pkts += txp->npkt;
4967a59a1477SNavdeep Parhar 		txq->txpkts1_wrs++;
4968a59a1477SNavdeep Parhar 	}
4969a59a1477SNavdeep Parhar 
49707951040fSNavdeep Parhar 	txsd = &txq->sdesc[eq->pidx];
49717951040fSNavdeep Parhar 	txsd->m = m0;
49727951040fSNavdeep Parhar 	txsd->desc_used = ndesc;
49737951040fSNavdeep Parhar 
49747951040fSNavdeep Parhar 	return (ndesc);
497554e4ee71SNavdeep Parhar }
497654e4ee71SNavdeep Parhar 
497754e4ee71SNavdeep Parhar /*
497854e4ee71SNavdeep Parhar  * If the SGL ends on an address that is not 16 byte aligned, this function will
49797951040fSNavdeep Parhar  * add a 0 filled flit at the end.
498054e4ee71SNavdeep Parhar  */
49817951040fSNavdeep Parhar static void
49827951040fSNavdeep Parhar write_gl_to_txd(struct sge_txq *txq, struct mbuf *m, caddr_t *to, int checkwrap)
498354e4ee71SNavdeep Parhar {
49847951040fSNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
49857951040fSNavdeep Parhar 	struct sglist *gl = txq->gl;
49867951040fSNavdeep Parhar 	struct sglist_seg *seg;
49877951040fSNavdeep Parhar 	__be64 *flitp, *wrap;
498854e4ee71SNavdeep Parhar 	struct ulptx_sgl *usgl;
49897951040fSNavdeep Parhar 	int i, nflits, nsegs;
499054e4ee71SNavdeep Parhar 
499154e4ee71SNavdeep Parhar 	KASSERT(((uintptr_t)(*to) & 0xf) == 0,
499254e4ee71SNavdeep Parhar 	    ("%s: SGL must start at a 16 byte boundary: %p", __func__, *to));
49937951040fSNavdeep Parhar 	MPASS((uintptr_t)(*to) >= (uintptr_t)&eq->desc[0]);
49947951040fSNavdeep Parhar 	MPASS((uintptr_t)(*to) < (uintptr_t)&eq->desc[eq->sidx]);
499554e4ee71SNavdeep Parhar 
49967951040fSNavdeep Parhar 	get_pkt_gl(m, gl);
49977951040fSNavdeep Parhar 	nsegs = gl->sg_nseg;
49987951040fSNavdeep Parhar 	MPASS(nsegs > 0);
49997951040fSNavdeep Parhar 
50007951040fSNavdeep Parhar 	nflits = (3 * (nsegs - 1)) / 2 + ((nsegs - 1) & 1) + 2;
500154e4ee71SNavdeep Parhar 	flitp = (__be64 *)(*to);
50027951040fSNavdeep Parhar 	wrap = (__be64 *)(&eq->desc[eq->sidx]);
50037951040fSNavdeep Parhar 	seg = &gl->sg_segs[0];
500454e4ee71SNavdeep Parhar 	usgl = (void *)flitp;
500554e4ee71SNavdeep Parhar 
500654e4ee71SNavdeep Parhar 	/*
500754e4ee71SNavdeep Parhar 	 * We start at a 16 byte boundary somewhere inside the tx descriptor
500854e4ee71SNavdeep Parhar 	 * ring, so we're at least 16 bytes away from the status page.  There is
500954e4ee71SNavdeep Parhar 	 * no chance of a wrap around in the middle of usgl (which is 16 bytes).
501054e4ee71SNavdeep Parhar 	 */
501154e4ee71SNavdeep Parhar 
501254e4ee71SNavdeep Parhar 	usgl->cmd_nsge = htobe32(V_ULPTX_CMD(ULP_TX_SC_DSGL) |
50137951040fSNavdeep Parhar 	    V_ULPTX_NSGE(nsegs));
50147951040fSNavdeep Parhar 	usgl->len0 = htobe32(seg->ss_len);
50157951040fSNavdeep Parhar 	usgl->addr0 = htobe64(seg->ss_paddr);
501654e4ee71SNavdeep Parhar 	seg++;
501754e4ee71SNavdeep Parhar 
50187951040fSNavdeep Parhar 	if (checkwrap == 0 || (uintptr_t)(flitp + nflits) <= (uintptr_t)wrap) {
501954e4ee71SNavdeep Parhar 
502054e4ee71SNavdeep Parhar 		/* Won't wrap around at all */
502154e4ee71SNavdeep Parhar 
50227951040fSNavdeep Parhar 		for (i = 0; i < nsegs - 1; i++, seg++) {
50237951040fSNavdeep Parhar 			usgl->sge[i / 2].len[i & 1] = htobe32(seg->ss_len);
50247951040fSNavdeep Parhar 			usgl->sge[i / 2].addr[i & 1] = htobe64(seg->ss_paddr);
502554e4ee71SNavdeep Parhar 		}
502654e4ee71SNavdeep Parhar 		if (i & 1)
502754e4ee71SNavdeep Parhar 			usgl->sge[i / 2].len[1] = htobe32(0);
50287951040fSNavdeep Parhar 		flitp += nflits;
502954e4ee71SNavdeep Parhar 	} else {
503054e4ee71SNavdeep Parhar 
503154e4ee71SNavdeep Parhar 		/* Will wrap somewhere in the rest of the SGL */
503254e4ee71SNavdeep Parhar 
503354e4ee71SNavdeep Parhar 		/* 2 flits already written, write the rest flit by flit */
503454e4ee71SNavdeep Parhar 		flitp = (void *)(usgl + 1);
50357951040fSNavdeep Parhar 		for (i = 0; i < nflits - 2; i++) {
50367951040fSNavdeep Parhar 			if (flitp == wrap)
503754e4ee71SNavdeep Parhar 				flitp = (void *)eq->desc;
50387951040fSNavdeep Parhar 			*flitp++ = get_flit(seg, nsegs - 1, i);
503954e4ee71SNavdeep Parhar 		}
504054e4ee71SNavdeep Parhar 	}
504154e4ee71SNavdeep Parhar 
50427951040fSNavdeep Parhar 	if (nflits & 1) {
50437951040fSNavdeep Parhar 		MPASS(((uintptr_t)flitp) & 0xf);
50447951040fSNavdeep Parhar 		*flitp++ = 0;
50457951040fSNavdeep Parhar 	}
504654e4ee71SNavdeep Parhar 
50477951040fSNavdeep Parhar 	MPASS((((uintptr_t)flitp) & 0xf) == 0);
50487951040fSNavdeep Parhar 	if (__predict_false(flitp == wrap))
504954e4ee71SNavdeep Parhar 		*to = (void *)eq->desc;
505054e4ee71SNavdeep Parhar 	else
50517951040fSNavdeep Parhar 		*to = (void *)flitp;
505254e4ee71SNavdeep Parhar }
505354e4ee71SNavdeep Parhar 
505454e4ee71SNavdeep Parhar static inline void
505554e4ee71SNavdeep Parhar copy_to_txd(struct sge_eq *eq, caddr_t from, caddr_t *to, int len)
505654e4ee71SNavdeep Parhar {
50577951040fSNavdeep Parhar 
50587951040fSNavdeep Parhar 	MPASS((uintptr_t)(*to) >= (uintptr_t)&eq->desc[0]);
50597951040fSNavdeep Parhar 	MPASS((uintptr_t)(*to) < (uintptr_t)&eq->desc[eq->sidx]);
50607951040fSNavdeep Parhar 
50617951040fSNavdeep Parhar 	if (__predict_true((uintptr_t)(*to) + len <=
50627951040fSNavdeep Parhar 	    (uintptr_t)&eq->desc[eq->sidx])) {
506354e4ee71SNavdeep Parhar 		bcopy(from, *to, len);
506454e4ee71SNavdeep Parhar 		(*to) += len;
506554e4ee71SNavdeep Parhar 	} else {
50667951040fSNavdeep Parhar 		int portion = (uintptr_t)&eq->desc[eq->sidx] - (uintptr_t)(*to);
506754e4ee71SNavdeep Parhar 
506854e4ee71SNavdeep Parhar 		bcopy(from, *to, portion);
506954e4ee71SNavdeep Parhar 		from += portion;
507054e4ee71SNavdeep Parhar 		portion = len - portion;	/* remaining */
507154e4ee71SNavdeep Parhar 		bcopy(from, (void *)eq->desc, portion);
507254e4ee71SNavdeep Parhar 		(*to) = (caddr_t)eq->desc + portion;
507354e4ee71SNavdeep Parhar 	}
507454e4ee71SNavdeep Parhar }
507554e4ee71SNavdeep Parhar 
507654e4ee71SNavdeep Parhar static inline void
50777951040fSNavdeep Parhar ring_eq_db(struct adapter *sc, struct sge_eq *eq, u_int n)
507854e4ee71SNavdeep Parhar {
50797951040fSNavdeep Parhar 	u_int db;
50807951040fSNavdeep Parhar 
50817951040fSNavdeep Parhar 	MPASS(n > 0);
5082d14b0ac1SNavdeep Parhar 
5083d14b0ac1SNavdeep Parhar 	db = eq->doorbells;
50847951040fSNavdeep Parhar 	if (n > 1)
508577ad3c41SNavdeep Parhar 		clrbit(&db, DOORBELL_WCWR);
5086d14b0ac1SNavdeep Parhar 	wmb();
5087d14b0ac1SNavdeep Parhar 
5088d14b0ac1SNavdeep Parhar 	switch (ffs(db) - 1) {
5089d14b0ac1SNavdeep Parhar 	case DOORBELL_UDB:
50907951040fSNavdeep Parhar 		*eq->udb = htole32(V_QID(eq->udb_qid) | V_PIDX(n));
50917951040fSNavdeep Parhar 		break;
5092d14b0ac1SNavdeep Parhar 
509377ad3c41SNavdeep Parhar 	case DOORBELL_WCWR: {
5094d14b0ac1SNavdeep Parhar 		volatile uint64_t *dst, *src;
5095d14b0ac1SNavdeep Parhar 		int i;
5096d14b0ac1SNavdeep Parhar 
5097d14b0ac1SNavdeep Parhar 		/*
5098d14b0ac1SNavdeep Parhar 		 * Queues whose 128B doorbell segment fits in the page do not
5099d14b0ac1SNavdeep Parhar 		 * use relative qid (udb_qid is always 0).  Only queues with
510077ad3c41SNavdeep Parhar 		 * doorbell segments can do WCWR.
5101d14b0ac1SNavdeep Parhar 		 */
51027951040fSNavdeep Parhar 		KASSERT(eq->udb_qid == 0 && n == 1,
5103d14b0ac1SNavdeep Parhar 		    ("%s: inappropriate doorbell (0x%x, %d, %d) for eq %p",
51047951040fSNavdeep Parhar 		    __func__, eq->doorbells, n, eq->dbidx, eq));
5105d14b0ac1SNavdeep Parhar 
5106d14b0ac1SNavdeep Parhar 		dst = (volatile void *)((uintptr_t)eq->udb + UDBS_WR_OFFSET -
5107d14b0ac1SNavdeep Parhar 		    UDBS_DB_OFFSET);
51087951040fSNavdeep Parhar 		i = eq->dbidx;
5109d14b0ac1SNavdeep Parhar 		src = (void *)&eq->desc[i];
5110d14b0ac1SNavdeep Parhar 		while (src != (void *)&eq->desc[i + 1])
5111d14b0ac1SNavdeep Parhar 			*dst++ = *src++;
5112d14b0ac1SNavdeep Parhar 		wmb();
51137951040fSNavdeep Parhar 		break;
5114d14b0ac1SNavdeep Parhar 	}
5115d14b0ac1SNavdeep Parhar 
5116d14b0ac1SNavdeep Parhar 	case DOORBELL_UDBWC:
51177951040fSNavdeep Parhar 		*eq->udb = htole32(V_QID(eq->udb_qid) | V_PIDX(n));
5118d14b0ac1SNavdeep Parhar 		wmb();
51197951040fSNavdeep Parhar 		break;
5120d14b0ac1SNavdeep Parhar 
5121d14b0ac1SNavdeep Parhar 	case DOORBELL_KDB:
5122315048f2SJohn Baldwin 		t4_write_reg(sc, sc->sge_kdoorbell_reg,
51237951040fSNavdeep Parhar 		    V_QID(eq->cntxt_id) | V_PIDX(n));
51247951040fSNavdeep Parhar 		break;
512554e4ee71SNavdeep Parhar 	}
512654e4ee71SNavdeep Parhar 
51277951040fSNavdeep Parhar 	IDXINCR(eq->dbidx, n, eq->sidx);
51287951040fSNavdeep Parhar }
51297951040fSNavdeep Parhar 
51307951040fSNavdeep Parhar static inline u_int
51317951040fSNavdeep Parhar reclaimable_tx_desc(struct sge_eq *eq)
513254e4ee71SNavdeep Parhar {
51337951040fSNavdeep Parhar 	uint16_t hw_cidx;
513454e4ee71SNavdeep Parhar 
51357951040fSNavdeep Parhar 	hw_cidx = read_hw_cidx(eq);
51367951040fSNavdeep Parhar 	return (IDXDIFF(hw_cidx, eq->cidx, eq->sidx));
51377951040fSNavdeep Parhar }
513854e4ee71SNavdeep Parhar 
51397951040fSNavdeep Parhar static inline u_int
51407951040fSNavdeep Parhar total_available_tx_desc(struct sge_eq *eq)
51417951040fSNavdeep Parhar {
51427951040fSNavdeep Parhar 	uint16_t hw_cidx, pidx;
51437951040fSNavdeep Parhar 
51447951040fSNavdeep Parhar 	hw_cidx = read_hw_cidx(eq);
51457951040fSNavdeep Parhar 	pidx = eq->pidx;
51467951040fSNavdeep Parhar 
51477951040fSNavdeep Parhar 	if (pidx == hw_cidx)
51487951040fSNavdeep Parhar 		return (eq->sidx - 1);
514954e4ee71SNavdeep Parhar 	else
51507951040fSNavdeep Parhar 		return (IDXDIFF(hw_cidx, pidx, eq->sidx) - 1);
51517951040fSNavdeep Parhar }
51527951040fSNavdeep Parhar 
51537951040fSNavdeep Parhar static inline uint16_t
51547951040fSNavdeep Parhar read_hw_cidx(struct sge_eq *eq)
51557951040fSNavdeep Parhar {
51567951040fSNavdeep Parhar 	struct sge_qstat *spg = (void *)&eq->desc[eq->sidx];
51577951040fSNavdeep Parhar 	uint16_t cidx = spg->cidx;	/* stable snapshot */
51587951040fSNavdeep Parhar 
51597951040fSNavdeep Parhar 	return (be16toh(cidx));
5160e874ff7aSNavdeep Parhar }
516154e4ee71SNavdeep Parhar 
5162e874ff7aSNavdeep Parhar /*
51637951040fSNavdeep Parhar  * Reclaim 'n' descriptors approximately.
5164e874ff7aSNavdeep Parhar  */
51657951040fSNavdeep Parhar static u_int
51667951040fSNavdeep Parhar reclaim_tx_descs(struct sge_txq *txq, u_int n)
5167e874ff7aSNavdeep Parhar {
5168e874ff7aSNavdeep Parhar 	struct tx_sdesc *txsd;
5169f7dfe243SNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
51707951040fSNavdeep Parhar 	u_int can_reclaim, reclaimed;
517154e4ee71SNavdeep Parhar 
5172733b9277SNavdeep Parhar 	TXQ_LOCK_ASSERT_OWNED(txq);
51737951040fSNavdeep Parhar 	MPASS(n > 0);
5174e874ff7aSNavdeep Parhar 
51757951040fSNavdeep Parhar 	reclaimed = 0;
51767951040fSNavdeep Parhar 	can_reclaim = reclaimable_tx_desc(eq);
51777951040fSNavdeep Parhar 	while (can_reclaim && reclaimed < n) {
517854e4ee71SNavdeep Parhar 		int ndesc;
51797951040fSNavdeep Parhar 		struct mbuf *m, *nextpkt;
518054e4ee71SNavdeep Parhar 
5181f7dfe243SNavdeep Parhar 		txsd = &txq->sdesc[eq->cidx];
518254e4ee71SNavdeep Parhar 		ndesc = txsd->desc_used;
518354e4ee71SNavdeep Parhar 
518454e4ee71SNavdeep Parhar 		/* Firmware doesn't return "partial" credits. */
518554e4ee71SNavdeep Parhar 		KASSERT(can_reclaim >= ndesc,
518654e4ee71SNavdeep Parhar 		    ("%s: unexpected number of credits: %d, %d",
518754e4ee71SNavdeep Parhar 		    __func__, can_reclaim, ndesc));
5188dcd50a20SJohn Baldwin 		KASSERT(ndesc != 0,
5189dcd50a20SJohn Baldwin 		    ("%s: descriptor with no credits: cidx %d",
5190dcd50a20SJohn Baldwin 		    __func__, eq->cidx));
519154e4ee71SNavdeep Parhar 
51927951040fSNavdeep Parhar 		for (m = txsd->m; m != NULL; m = nextpkt) {
51937951040fSNavdeep Parhar 			nextpkt = m->m_nextpkt;
51947951040fSNavdeep Parhar 			m->m_nextpkt = NULL;
51957951040fSNavdeep Parhar 			m_freem(m);
51967951040fSNavdeep Parhar 		}
519754e4ee71SNavdeep Parhar 		reclaimed += ndesc;
519854e4ee71SNavdeep Parhar 		can_reclaim -= ndesc;
51997951040fSNavdeep Parhar 		IDXINCR(eq->cidx, ndesc, eq->sidx);
520054e4ee71SNavdeep Parhar 	}
520154e4ee71SNavdeep Parhar 
520254e4ee71SNavdeep Parhar 	return (reclaimed);
520354e4ee71SNavdeep Parhar }
520454e4ee71SNavdeep Parhar 
520554e4ee71SNavdeep Parhar static void
52067951040fSNavdeep Parhar tx_reclaim(void *arg, int n)
520754e4ee71SNavdeep Parhar {
52087951040fSNavdeep Parhar 	struct sge_txq *txq = arg;
52097951040fSNavdeep Parhar 	struct sge_eq *eq = &txq->eq;
521054e4ee71SNavdeep Parhar 
52117951040fSNavdeep Parhar 	do {
52127951040fSNavdeep Parhar 		if (TXQ_TRYLOCK(txq) == 0)
52137951040fSNavdeep Parhar 			break;
52147951040fSNavdeep Parhar 		n = reclaim_tx_descs(txq, 32);
52157951040fSNavdeep Parhar 		if (eq->cidx == eq->pidx)
52167951040fSNavdeep Parhar 			eq->equeqidx = eq->pidx;
52177951040fSNavdeep Parhar 		TXQ_UNLOCK(txq);
52187951040fSNavdeep Parhar 	} while (n > 0);
521954e4ee71SNavdeep Parhar }
522054e4ee71SNavdeep Parhar 
522154e4ee71SNavdeep Parhar static __be64
52227951040fSNavdeep Parhar get_flit(struct sglist_seg *segs, int nsegs, int idx)
522354e4ee71SNavdeep Parhar {
522454e4ee71SNavdeep Parhar 	int i = (idx / 3) * 2;
522554e4ee71SNavdeep Parhar 
522654e4ee71SNavdeep Parhar 	switch (idx % 3) {
522754e4ee71SNavdeep Parhar 	case 0: {
5228f078ecf6SWojciech Macek 		uint64_t rc;
522954e4ee71SNavdeep Parhar 
5230f078ecf6SWojciech Macek 		rc = (uint64_t)segs[i].ss_len << 32;
523154e4ee71SNavdeep Parhar 		if (i + 1 < nsegs)
5232f078ecf6SWojciech Macek 			rc |= (uint64_t)(segs[i + 1].ss_len);
523354e4ee71SNavdeep Parhar 
5234f078ecf6SWojciech Macek 		return (htobe64(rc));
523554e4ee71SNavdeep Parhar 	}
523654e4ee71SNavdeep Parhar 	case 1:
52377951040fSNavdeep Parhar 		return (htobe64(segs[i].ss_paddr));
523854e4ee71SNavdeep Parhar 	case 2:
52397951040fSNavdeep Parhar 		return (htobe64(segs[i + 1].ss_paddr));
524054e4ee71SNavdeep Parhar 	}
524154e4ee71SNavdeep Parhar 
524254e4ee71SNavdeep Parhar 	return (0);
524354e4ee71SNavdeep Parhar }
524454e4ee71SNavdeep Parhar 
524554e4ee71SNavdeep Parhar static void
524638035ed6SNavdeep Parhar find_best_refill_source(struct adapter *sc, struct sge_fl *fl, int maxp)
524754e4ee71SNavdeep Parhar {
524838035ed6SNavdeep Parhar 	int8_t zidx, hwidx, idx;
524938035ed6SNavdeep Parhar 	uint16_t region1, region3;
525038035ed6SNavdeep Parhar 	int spare, spare_needed, n;
525138035ed6SNavdeep Parhar 	struct sw_zone_info *swz;
525238035ed6SNavdeep Parhar 	struct hw_buf_info *hwb, *hwb_list = &sc->sge.hw_buf_info[0];
525354e4ee71SNavdeep Parhar 
525438035ed6SNavdeep Parhar 	/*
525538035ed6SNavdeep Parhar 	 * Buffer Packing: Look for PAGE_SIZE or larger zone which has a bufsize
525638035ed6SNavdeep Parhar 	 * large enough for the max payload and cluster metadata.  Otherwise
525738035ed6SNavdeep Parhar 	 * settle for the largest bufsize that leaves enough room in the cluster
525838035ed6SNavdeep Parhar 	 * for metadata.
525938035ed6SNavdeep Parhar 	 *
526038035ed6SNavdeep Parhar 	 * Without buffer packing: Look for the smallest zone which has a
526138035ed6SNavdeep Parhar 	 * bufsize large enough for the max payload.  Settle for the largest
526238035ed6SNavdeep Parhar 	 * bufsize available if there's nothing big enough for max payload.
526338035ed6SNavdeep Parhar 	 */
526438035ed6SNavdeep Parhar 	spare_needed = fl->flags & FL_BUF_PACKING ? CL_METADATA_SIZE : 0;
526538035ed6SNavdeep Parhar 	swz = &sc->sge.sw_zone_info[0];
526638035ed6SNavdeep Parhar 	hwidx = -1;
526738035ed6SNavdeep Parhar 	for (zidx = 0; zidx < SW_ZONE_SIZES; zidx++, swz++) {
526838035ed6SNavdeep Parhar 		if (swz->size > largest_rx_cluster) {
526938035ed6SNavdeep Parhar 			if (__predict_true(hwidx != -1))
527038035ed6SNavdeep Parhar 				break;
527138035ed6SNavdeep Parhar 
527238035ed6SNavdeep Parhar 			/*
527338035ed6SNavdeep Parhar 			 * This is a misconfiguration.  largest_rx_cluster is
527438035ed6SNavdeep Parhar 			 * preventing us from finding a refill source.  See
527538035ed6SNavdeep Parhar 			 * dev.t5nex.<n>.buffer_sizes to figure out why.
527638035ed6SNavdeep Parhar 			 */
527738035ed6SNavdeep Parhar 			device_printf(sc->dev, "largest_rx_cluster=%u leaves no"
527838035ed6SNavdeep Parhar 			    " refill source for fl %p (dma %u).  Ignored.\n",
527938035ed6SNavdeep Parhar 			    largest_rx_cluster, fl, maxp);
528038035ed6SNavdeep Parhar 		}
528138035ed6SNavdeep Parhar 		for (idx = swz->head_hwidx; idx != -1; idx = hwb->next) {
528238035ed6SNavdeep Parhar 			hwb = &hwb_list[idx];
528338035ed6SNavdeep Parhar 			spare = swz->size - hwb->size;
528438035ed6SNavdeep Parhar 			if (spare < spare_needed)
528538035ed6SNavdeep Parhar 				continue;
528638035ed6SNavdeep Parhar 
528738035ed6SNavdeep Parhar 			hwidx = idx;		/* best option so far */
528838035ed6SNavdeep Parhar 			if (hwb->size >= maxp) {
528938035ed6SNavdeep Parhar 
529038035ed6SNavdeep Parhar 				if ((fl->flags & FL_BUF_PACKING) == 0)
529138035ed6SNavdeep Parhar 					goto done; /* stop looking (not packing) */
529238035ed6SNavdeep Parhar 
529338035ed6SNavdeep Parhar 				if (swz->size >= safest_rx_cluster)
529438035ed6SNavdeep Parhar 					goto done; /* stop looking (packing) */
529538035ed6SNavdeep Parhar 			}
529638035ed6SNavdeep Parhar 			break;		/* keep looking, next zone */
529738035ed6SNavdeep Parhar 		}
529838035ed6SNavdeep Parhar 	}
529938035ed6SNavdeep Parhar done:
530038035ed6SNavdeep Parhar 	/* A usable hwidx has been located. */
530138035ed6SNavdeep Parhar 	MPASS(hwidx != -1);
530238035ed6SNavdeep Parhar 	hwb = &hwb_list[hwidx];
530338035ed6SNavdeep Parhar 	zidx = hwb->zidx;
530438035ed6SNavdeep Parhar 	swz = &sc->sge.sw_zone_info[zidx];
530538035ed6SNavdeep Parhar 	region1 = 0;
530638035ed6SNavdeep Parhar 	region3 = swz->size - hwb->size;
530738035ed6SNavdeep Parhar 
530838035ed6SNavdeep Parhar 	/*
530938035ed6SNavdeep Parhar 	 * Stay within this zone and see if there is a better match when mbuf
531038035ed6SNavdeep Parhar 	 * inlining is allowed.  Remember that the hwidx's are sorted in
531138035ed6SNavdeep Parhar 	 * decreasing order of size (so in increasing order of spare area).
531238035ed6SNavdeep Parhar 	 */
531338035ed6SNavdeep Parhar 	for (idx = hwidx; idx != -1; idx = hwb->next) {
531438035ed6SNavdeep Parhar 		hwb = &hwb_list[idx];
531538035ed6SNavdeep Parhar 		spare = swz->size - hwb->size;
531638035ed6SNavdeep Parhar 
531738035ed6SNavdeep Parhar 		if (allow_mbufs_in_cluster == 0 || hwb->size < maxp)
531838035ed6SNavdeep Parhar 			break;
5319e3207e19SNavdeep Parhar 
5320e3207e19SNavdeep Parhar 		/*
5321e3207e19SNavdeep Parhar 		 * Do not inline mbufs if doing so would violate the pad/pack
5322e3207e19SNavdeep Parhar 		 * boundary alignment requirement.
5323e3207e19SNavdeep Parhar 		 */
532490e7434aSNavdeep Parhar 		if (fl_pad && (MSIZE % sc->params.sge.pad_boundary) != 0)
5325e3207e19SNavdeep Parhar 			continue;
5326e3207e19SNavdeep Parhar 		if (fl->flags & FL_BUF_PACKING &&
532790e7434aSNavdeep Parhar 		    (MSIZE % sc->params.sge.pack_boundary) != 0)
5328e3207e19SNavdeep Parhar 			continue;
5329e3207e19SNavdeep Parhar 
533038035ed6SNavdeep Parhar 		if (spare < CL_METADATA_SIZE + MSIZE)
533138035ed6SNavdeep Parhar 			continue;
533238035ed6SNavdeep Parhar 		n = (spare - CL_METADATA_SIZE) / MSIZE;
533338035ed6SNavdeep Parhar 		if (n > howmany(hwb->size, maxp))
533438035ed6SNavdeep Parhar 			break;
533538035ed6SNavdeep Parhar 
533638035ed6SNavdeep Parhar 		hwidx = idx;
53371458bff9SNavdeep Parhar 		if (fl->flags & FL_BUF_PACKING) {
533838035ed6SNavdeep Parhar 			region1 = n * MSIZE;
533938035ed6SNavdeep Parhar 			region3 = spare - region1;
534038035ed6SNavdeep Parhar 		} else {
534138035ed6SNavdeep Parhar 			region1 = MSIZE;
534238035ed6SNavdeep Parhar 			region3 = spare - region1;
534338035ed6SNavdeep Parhar 			break;
534438035ed6SNavdeep Parhar 		}
534538035ed6SNavdeep Parhar 	}
534638035ed6SNavdeep Parhar 
534738035ed6SNavdeep Parhar 	KASSERT(zidx >= 0 && zidx < SW_ZONE_SIZES,
534838035ed6SNavdeep Parhar 	    ("%s: bad zone %d for fl %p, maxp %d", __func__, zidx, fl, maxp));
534938035ed6SNavdeep Parhar 	KASSERT(hwidx >= 0 && hwidx <= SGE_FLBUF_SIZES,
535038035ed6SNavdeep Parhar 	    ("%s: bad hwidx %d for fl %p, maxp %d", __func__, hwidx, fl, maxp));
535138035ed6SNavdeep Parhar 	KASSERT(region1 + sc->sge.hw_buf_info[hwidx].size + region3 ==
535238035ed6SNavdeep Parhar 	    sc->sge.sw_zone_info[zidx].size,
535338035ed6SNavdeep Parhar 	    ("%s: bad buffer layout for fl %p, maxp %d. "
535438035ed6SNavdeep Parhar 		"cl %d; r1 %d, payload %d, r3 %d", __func__, fl, maxp,
535538035ed6SNavdeep Parhar 		sc->sge.sw_zone_info[zidx].size, region1,
535638035ed6SNavdeep Parhar 		sc->sge.hw_buf_info[hwidx].size, region3));
535738035ed6SNavdeep Parhar 	if (fl->flags & FL_BUF_PACKING || region1 > 0) {
535838035ed6SNavdeep Parhar 		KASSERT(region3 >= CL_METADATA_SIZE,
535938035ed6SNavdeep Parhar 		    ("%s: no room for metadata.  fl %p, maxp %d; "
536038035ed6SNavdeep Parhar 		    "cl %d; r1 %d, payload %d, r3 %d", __func__, fl, maxp,
536138035ed6SNavdeep Parhar 		    sc->sge.sw_zone_info[zidx].size, region1,
536238035ed6SNavdeep Parhar 		    sc->sge.hw_buf_info[hwidx].size, region3));
536338035ed6SNavdeep Parhar 		KASSERT(region1 % MSIZE == 0,
536438035ed6SNavdeep Parhar 		    ("%s: bad mbuf region for fl %p, maxp %d. "
536538035ed6SNavdeep Parhar 		    "cl %d; r1 %d, payload %d, r3 %d", __func__, fl, maxp,
536638035ed6SNavdeep Parhar 		    sc->sge.sw_zone_info[zidx].size, region1,
536738035ed6SNavdeep Parhar 		    sc->sge.hw_buf_info[hwidx].size, region3));
536838035ed6SNavdeep Parhar 	}
536938035ed6SNavdeep Parhar 
537038035ed6SNavdeep Parhar 	fl->cll_def.zidx = zidx;
537138035ed6SNavdeep Parhar 	fl->cll_def.hwidx = hwidx;
537238035ed6SNavdeep Parhar 	fl->cll_def.region1 = region1;
537338035ed6SNavdeep Parhar 	fl->cll_def.region3 = region3;
537438035ed6SNavdeep Parhar }
537538035ed6SNavdeep Parhar 
537638035ed6SNavdeep Parhar static void
537738035ed6SNavdeep Parhar find_safe_refill_source(struct adapter *sc, struct sge_fl *fl)
537838035ed6SNavdeep Parhar {
537938035ed6SNavdeep Parhar 	struct sge *s = &sc->sge;
538038035ed6SNavdeep Parhar 	struct hw_buf_info *hwb;
538138035ed6SNavdeep Parhar 	struct sw_zone_info *swz;
538238035ed6SNavdeep Parhar 	int spare;
538338035ed6SNavdeep Parhar 	int8_t hwidx;
538438035ed6SNavdeep Parhar 
538538035ed6SNavdeep Parhar 	if (fl->flags & FL_BUF_PACKING)
538638035ed6SNavdeep Parhar 		hwidx = s->safe_hwidx2;	/* with room for metadata */
538738035ed6SNavdeep Parhar 	else if (allow_mbufs_in_cluster && s->safe_hwidx2 != -1) {
538838035ed6SNavdeep Parhar 		hwidx = s->safe_hwidx2;
538938035ed6SNavdeep Parhar 		hwb = &s->hw_buf_info[hwidx];
539038035ed6SNavdeep Parhar 		swz = &s->sw_zone_info[hwb->zidx];
539138035ed6SNavdeep Parhar 		spare = swz->size - hwb->size;
539238035ed6SNavdeep Parhar 
539338035ed6SNavdeep Parhar 		/* no good if there isn't room for an mbuf as well */
539438035ed6SNavdeep Parhar 		if (spare < CL_METADATA_SIZE + MSIZE)
539538035ed6SNavdeep Parhar 			hwidx = s->safe_hwidx1;
539638035ed6SNavdeep Parhar 	} else
539738035ed6SNavdeep Parhar 		hwidx = s->safe_hwidx1;
539838035ed6SNavdeep Parhar 
539938035ed6SNavdeep Parhar 	if (hwidx == -1) {
540038035ed6SNavdeep Parhar 		/* No fallback source */
540138035ed6SNavdeep Parhar 		fl->cll_alt.hwidx = -1;
540238035ed6SNavdeep Parhar 		fl->cll_alt.zidx = -1;
540338035ed6SNavdeep Parhar 
54041458bff9SNavdeep Parhar 		return;
540554e4ee71SNavdeep Parhar 	}
540654e4ee71SNavdeep Parhar 
540738035ed6SNavdeep Parhar 	hwb = &s->hw_buf_info[hwidx];
540838035ed6SNavdeep Parhar 	swz = &s->sw_zone_info[hwb->zidx];
540938035ed6SNavdeep Parhar 	spare = swz->size - hwb->size;
541038035ed6SNavdeep Parhar 	fl->cll_alt.hwidx = hwidx;
541138035ed6SNavdeep Parhar 	fl->cll_alt.zidx = hwb->zidx;
5412e3207e19SNavdeep Parhar 	if (allow_mbufs_in_cluster &&
541390e7434aSNavdeep Parhar 	    (fl_pad == 0 || (MSIZE % sc->params.sge.pad_boundary) == 0))
541438035ed6SNavdeep Parhar 		fl->cll_alt.region1 = ((spare - CL_METADATA_SIZE) / MSIZE) * MSIZE;
54151458bff9SNavdeep Parhar 	else
541638035ed6SNavdeep Parhar 		fl->cll_alt.region1 = 0;
541738035ed6SNavdeep Parhar 	fl->cll_alt.region3 = spare - fl->cll_alt.region1;
541854e4ee71SNavdeep Parhar }
5419ecb79ca4SNavdeep Parhar 
5420733b9277SNavdeep Parhar static void
5421733b9277SNavdeep Parhar add_fl_to_sfl(struct adapter *sc, struct sge_fl *fl)
5422ecb79ca4SNavdeep Parhar {
5423733b9277SNavdeep Parhar 	mtx_lock(&sc->sfl_lock);
5424733b9277SNavdeep Parhar 	FL_LOCK(fl);
5425733b9277SNavdeep Parhar 	if ((fl->flags & FL_DOOMED) == 0) {
5426733b9277SNavdeep Parhar 		fl->flags |= FL_STARVING;
5427733b9277SNavdeep Parhar 		TAILQ_INSERT_TAIL(&sc->sfl, fl, link);
5428733b9277SNavdeep Parhar 		callout_reset(&sc->sfl_callout, hz / 5, refill_sfl, sc);
5429733b9277SNavdeep Parhar 	}
5430733b9277SNavdeep Parhar 	FL_UNLOCK(fl);
5431733b9277SNavdeep Parhar 	mtx_unlock(&sc->sfl_lock);
5432733b9277SNavdeep Parhar }
5433ecb79ca4SNavdeep Parhar 
54347951040fSNavdeep Parhar static void
54357951040fSNavdeep Parhar handle_wrq_egr_update(struct adapter *sc, struct sge_eq *eq)
54367951040fSNavdeep Parhar {
54377951040fSNavdeep Parhar 	struct sge_wrq *wrq = (void *)eq;
54387951040fSNavdeep Parhar 
54397951040fSNavdeep Parhar 	atomic_readandclear_int(&eq->equiq);
54407951040fSNavdeep Parhar 	taskqueue_enqueue(sc->tq[eq->tx_chan], &wrq->wrq_tx_task);
54417951040fSNavdeep Parhar }
54427951040fSNavdeep Parhar 
54437951040fSNavdeep Parhar static void
54447951040fSNavdeep Parhar handle_eth_egr_update(struct adapter *sc, struct sge_eq *eq)
54457951040fSNavdeep Parhar {
54467951040fSNavdeep Parhar 	struct sge_txq *txq = (void *)eq;
54477951040fSNavdeep Parhar 
54487951040fSNavdeep Parhar 	MPASS((eq->flags & EQ_TYPEMASK) == EQ_ETH);
54497951040fSNavdeep Parhar 
54507951040fSNavdeep Parhar 	atomic_readandclear_int(&eq->equiq);
54517951040fSNavdeep Parhar 	mp_ring_check_drainage(txq->r, 0);
54527951040fSNavdeep Parhar 	taskqueue_enqueue(sc->tq[eq->tx_chan], &txq->tx_reclaim_task);
54537951040fSNavdeep Parhar }
54547951040fSNavdeep Parhar 
5455733b9277SNavdeep Parhar static int
5456733b9277SNavdeep Parhar handle_sge_egr_update(struct sge_iq *iq, const struct rss_header *rss,
5457733b9277SNavdeep Parhar     struct mbuf *m)
5458733b9277SNavdeep Parhar {
5459733b9277SNavdeep Parhar 	const struct cpl_sge_egr_update *cpl = (const void *)(rss + 1);
5460733b9277SNavdeep Parhar 	unsigned int qid = G_EGR_QID(ntohl(cpl->opcode_qid));
5461733b9277SNavdeep Parhar 	struct adapter *sc = iq->adapter;
5462733b9277SNavdeep Parhar 	struct sge *s = &sc->sge;
5463733b9277SNavdeep Parhar 	struct sge_eq *eq;
54647951040fSNavdeep Parhar 	static void (*h[])(struct adapter *, struct sge_eq *) = {NULL,
54657951040fSNavdeep Parhar 		&handle_wrq_egr_update, &handle_eth_egr_update,
54667951040fSNavdeep Parhar 		&handle_wrq_egr_update};
5467733b9277SNavdeep Parhar 
5468733b9277SNavdeep Parhar 	KASSERT(m == NULL, ("%s: payload with opcode %02x", __func__,
5469733b9277SNavdeep Parhar 	    rss->opcode));
5470733b9277SNavdeep Parhar 
5471ec55567cSJohn Baldwin 	eq = s->eqmap[qid - s->eq_start - s->eq_base];
54727951040fSNavdeep Parhar 	(*h[eq->flags & EQ_TYPEMASK])(sc, eq);
5473ecb79ca4SNavdeep Parhar 
5474ecb79ca4SNavdeep Parhar 	return (0);
5475ecb79ca4SNavdeep Parhar }
5476f7dfe243SNavdeep Parhar 
54770abd31e2SNavdeep Parhar /* handle_fw_msg works for both fw4_msg and fw6_msg because this is valid */
54780abd31e2SNavdeep Parhar CTASSERT(offsetof(struct cpl_fw4_msg, data) == \
54790abd31e2SNavdeep Parhar     offsetof(struct cpl_fw6_msg, data));
54800abd31e2SNavdeep Parhar 
5481733b9277SNavdeep Parhar static int
54821b4cc91fSNavdeep Parhar handle_fw_msg(struct sge_iq *iq, const struct rss_header *rss, struct mbuf *m)
548356599263SNavdeep Parhar {
54841b4cc91fSNavdeep Parhar 	struct adapter *sc = iq->adapter;
548556599263SNavdeep Parhar 	const struct cpl_fw6_msg *cpl = (const void *)(rss + 1);
548656599263SNavdeep Parhar 
5487733b9277SNavdeep Parhar 	KASSERT(m == NULL, ("%s: payload with opcode %02x", __func__,
5488733b9277SNavdeep Parhar 	    rss->opcode));
5489733b9277SNavdeep Parhar 
54900abd31e2SNavdeep Parhar 	if (cpl->type == FW_TYPE_RSSCPL || cpl->type == FW6_TYPE_RSSCPL) {
54910abd31e2SNavdeep Parhar 		const struct rss_header *rss2;
54920abd31e2SNavdeep Parhar 
54930abd31e2SNavdeep Parhar 		rss2 = (const struct rss_header *)&cpl->data[0];
5494671bf2b8SNavdeep Parhar 		return (t4_cpl_handler[rss2->opcode](iq, rss2, m));
54950abd31e2SNavdeep Parhar 	}
54960abd31e2SNavdeep Parhar 
5497671bf2b8SNavdeep Parhar 	return (t4_fw_msg_handler[cpl->type](sc, &cpl->data[0]));
5498f7dfe243SNavdeep Parhar }
5499af49c942SNavdeep Parhar 
5500069af0ebSJohn Baldwin /**
5501069af0ebSJohn Baldwin  *	t4_handle_wrerr_rpl - process a FW work request error message
5502069af0ebSJohn Baldwin  *	@adap: the adapter
5503069af0ebSJohn Baldwin  *	@rpl: start of the FW message
5504069af0ebSJohn Baldwin  */
5505069af0ebSJohn Baldwin static int
5506069af0ebSJohn Baldwin t4_handle_wrerr_rpl(struct adapter *adap, const __be64 *rpl)
5507069af0ebSJohn Baldwin {
5508069af0ebSJohn Baldwin 	u8 opcode = *(const u8 *)rpl;
5509069af0ebSJohn Baldwin 	const struct fw_error_cmd *e = (const void *)rpl;
5510069af0ebSJohn Baldwin 	unsigned int i;
5511069af0ebSJohn Baldwin 
5512069af0ebSJohn Baldwin 	if (opcode != FW_ERROR_CMD) {
5513069af0ebSJohn Baldwin 		log(LOG_ERR,
5514069af0ebSJohn Baldwin 		    "%s: Received WRERR_RPL message with opcode %#x\n",
5515069af0ebSJohn Baldwin 		    device_get_nameunit(adap->dev), opcode);
5516069af0ebSJohn Baldwin 		return (EINVAL);
5517069af0ebSJohn Baldwin 	}
5518069af0ebSJohn Baldwin 	log(LOG_ERR, "%s: FW_ERROR (%s) ", device_get_nameunit(adap->dev),
5519069af0ebSJohn Baldwin 	    G_FW_ERROR_CMD_FATAL(be32toh(e->op_to_type)) ? "fatal" :
5520069af0ebSJohn Baldwin 	    "non-fatal");
5521069af0ebSJohn Baldwin 	switch (G_FW_ERROR_CMD_TYPE(be32toh(e->op_to_type))) {
5522069af0ebSJohn Baldwin 	case FW_ERROR_TYPE_EXCEPTION:
5523069af0ebSJohn Baldwin 		log(LOG_ERR, "exception info:\n");
5524069af0ebSJohn Baldwin 		for (i = 0; i < nitems(e->u.exception.info); i++)
5525069af0ebSJohn Baldwin 			log(LOG_ERR, "%s%08x", i == 0 ? "\t" : " ",
5526069af0ebSJohn Baldwin 			    be32toh(e->u.exception.info[i]));
5527069af0ebSJohn Baldwin 		log(LOG_ERR, "\n");
5528069af0ebSJohn Baldwin 		break;
5529069af0ebSJohn Baldwin 	case FW_ERROR_TYPE_HWMODULE:
5530069af0ebSJohn Baldwin 		log(LOG_ERR, "HW module regaddr %08x regval %08x\n",
5531069af0ebSJohn Baldwin 		    be32toh(e->u.hwmodule.regaddr),
5532069af0ebSJohn Baldwin 		    be32toh(e->u.hwmodule.regval));
5533069af0ebSJohn Baldwin 		break;
5534069af0ebSJohn Baldwin 	case FW_ERROR_TYPE_WR:
5535069af0ebSJohn Baldwin 		log(LOG_ERR, "WR cidx %d PF %d VF %d eqid %d hdr:\n",
5536069af0ebSJohn Baldwin 		    be16toh(e->u.wr.cidx),
5537069af0ebSJohn Baldwin 		    G_FW_ERROR_CMD_PFN(be16toh(e->u.wr.pfn_vfn)),
5538069af0ebSJohn Baldwin 		    G_FW_ERROR_CMD_VFN(be16toh(e->u.wr.pfn_vfn)),
5539069af0ebSJohn Baldwin 		    be32toh(e->u.wr.eqid));
5540069af0ebSJohn Baldwin 		for (i = 0; i < nitems(e->u.wr.wrhdr); i++)
5541069af0ebSJohn Baldwin 			log(LOG_ERR, "%s%02x", i == 0 ? "\t" : " ",
5542069af0ebSJohn Baldwin 			    e->u.wr.wrhdr[i]);
5543069af0ebSJohn Baldwin 		log(LOG_ERR, "\n");
5544069af0ebSJohn Baldwin 		break;
5545069af0ebSJohn Baldwin 	case FW_ERROR_TYPE_ACL:
5546069af0ebSJohn Baldwin 		log(LOG_ERR, "ACL cidx %d PF %d VF %d eqid %d %s",
5547069af0ebSJohn Baldwin 		    be16toh(e->u.acl.cidx),
5548069af0ebSJohn Baldwin 		    G_FW_ERROR_CMD_PFN(be16toh(e->u.acl.pfn_vfn)),
5549069af0ebSJohn Baldwin 		    G_FW_ERROR_CMD_VFN(be16toh(e->u.acl.pfn_vfn)),
5550069af0ebSJohn Baldwin 		    be32toh(e->u.acl.eqid),
5551069af0ebSJohn Baldwin 		    G_FW_ERROR_CMD_MV(be16toh(e->u.acl.mv_pkd)) ? "vlanid" :
5552069af0ebSJohn Baldwin 		    "MAC");
5553069af0ebSJohn Baldwin 		for (i = 0; i < nitems(e->u.acl.val); i++)
5554069af0ebSJohn Baldwin 			log(LOG_ERR, " %02x", e->u.acl.val[i]);
5555069af0ebSJohn Baldwin 		log(LOG_ERR, "\n");
5556069af0ebSJohn Baldwin 		break;
5557069af0ebSJohn Baldwin 	default:
5558069af0ebSJohn Baldwin 		log(LOG_ERR, "type %#x\n",
5559069af0ebSJohn Baldwin 		    G_FW_ERROR_CMD_TYPE(be32toh(e->op_to_type)));
5560069af0ebSJohn Baldwin 		return (EINVAL);
5561069af0ebSJohn Baldwin 	}
5562069af0ebSJohn Baldwin 	return (0);
5563069af0ebSJohn Baldwin }
5564069af0ebSJohn Baldwin 
5565af49c942SNavdeep Parhar static int
556656599263SNavdeep Parhar sysctl_uint16(SYSCTL_HANDLER_ARGS)
5567af49c942SNavdeep Parhar {
5568af49c942SNavdeep Parhar 	uint16_t *id = arg1;
5569af49c942SNavdeep Parhar 	int i = *id;
5570af49c942SNavdeep Parhar 
5571af49c942SNavdeep Parhar 	return sysctl_handle_int(oidp, &i, 0, req);
5572af49c942SNavdeep Parhar }
557338035ed6SNavdeep Parhar 
557438035ed6SNavdeep Parhar static int
557538035ed6SNavdeep Parhar sysctl_bufsizes(SYSCTL_HANDLER_ARGS)
557638035ed6SNavdeep Parhar {
557738035ed6SNavdeep Parhar 	struct sge *s = arg1;
557838035ed6SNavdeep Parhar 	struct hw_buf_info *hwb = &s->hw_buf_info[0];
557938035ed6SNavdeep Parhar 	struct sw_zone_info *swz = &s->sw_zone_info[0];
558038035ed6SNavdeep Parhar 	int i, rc;
558138035ed6SNavdeep Parhar 	struct sbuf sb;
558238035ed6SNavdeep Parhar 	char c;
558338035ed6SNavdeep Parhar 
558438035ed6SNavdeep Parhar 	sbuf_new(&sb, NULL, 32, SBUF_AUTOEXTEND);
558538035ed6SNavdeep Parhar 	for (i = 0; i < SGE_FLBUF_SIZES; i++, hwb++) {
558638035ed6SNavdeep Parhar 		if (hwb->zidx >= 0 && swz[hwb->zidx].size <= largest_rx_cluster)
558738035ed6SNavdeep Parhar 			c = '*';
558838035ed6SNavdeep Parhar 		else
558938035ed6SNavdeep Parhar 			c = '\0';
559038035ed6SNavdeep Parhar 
559138035ed6SNavdeep Parhar 		sbuf_printf(&sb, "%u%c ", hwb->size, c);
559238035ed6SNavdeep Parhar 	}
559338035ed6SNavdeep Parhar 	sbuf_trim(&sb);
559438035ed6SNavdeep Parhar 	sbuf_finish(&sb);
559538035ed6SNavdeep Parhar 	rc = sysctl_handle_string(oidp, sbuf_data(&sb), sbuf_len(&sb), req);
559638035ed6SNavdeep Parhar 	sbuf_delete(&sb);
559738035ed6SNavdeep Parhar 	return (rc);
559838035ed6SNavdeep Parhar }
559902f972e8SNavdeep Parhar 
5600786099deSNavdeep Parhar #ifdef RATELIMIT
5601786099deSNavdeep Parhar /*
5602786099deSNavdeep Parhar  * len16 for a txpkt WR with a GL.  Includes the firmware work request header.
5603786099deSNavdeep Parhar  */
5604786099deSNavdeep Parhar static inline u_int
5605786099deSNavdeep Parhar txpkt_eo_len16(u_int nsegs, u_int immhdrs, u_int tso)
5606786099deSNavdeep Parhar {
5607786099deSNavdeep Parhar 	u_int n;
5608786099deSNavdeep Parhar 
5609786099deSNavdeep Parhar 	MPASS(immhdrs > 0);
5610786099deSNavdeep Parhar 
5611786099deSNavdeep Parhar 	n = roundup2(sizeof(struct fw_eth_tx_eo_wr) +
5612786099deSNavdeep Parhar 	    sizeof(struct cpl_tx_pkt_core) + immhdrs, 16);
5613786099deSNavdeep Parhar 	if (__predict_false(nsegs == 0))
5614786099deSNavdeep Parhar 		goto done;
5615786099deSNavdeep Parhar 
5616786099deSNavdeep Parhar 	nsegs--; /* first segment is part of ulptx_sgl */
5617786099deSNavdeep Parhar 	n += sizeof(struct ulptx_sgl) + 8 * ((3 * nsegs) / 2 + (nsegs & 1));
5618786099deSNavdeep Parhar 	if (tso)
5619786099deSNavdeep Parhar 		n += sizeof(struct cpl_tx_pkt_lso_core);
5620786099deSNavdeep Parhar 
5621786099deSNavdeep Parhar done:
5622786099deSNavdeep Parhar 	return (howmany(n, 16));
5623786099deSNavdeep Parhar }
5624786099deSNavdeep Parhar 
5625786099deSNavdeep Parhar #define ETID_FLOWC_NPARAMS 6
5626786099deSNavdeep Parhar #define ETID_FLOWC_LEN (roundup2((sizeof(struct fw_flowc_wr) + \
5627786099deSNavdeep Parhar     ETID_FLOWC_NPARAMS * sizeof(struct fw_flowc_mnemval)), 16))
5628786099deSNavdeep Parhar #define ETID_FLOWC_LEN16 (howmany(ETID_FLOWC_LEN, 16))
5629786099deSNavdeep Parhar 
5630786099deSNavdeep Parhar static int
5631786099deSNavdeep Parhar send_etid_flowc_wr(struct cxgbe_snd_tag *cst, struct port_info *pi,
5632786099deSNavdeep Parhar     struct vi_info *vi)
5633786099deSNavdeep Parhar {
5634786099deSNavdeep Parhar 	struct wrq_cookie cookie;
5635786099deSNavdeep Parhar 	u_int pfvf = G_FW_VIID_PFN(vi->viid) << S_FW_VIID_PFN;
5636786099deSNavdeep Parhar 	struct fw_flowc_wr *flowc;
5637786099deSNavdeep Parhar 
5638786099deSNavdeep Parhar 	mtx_assert(&cst->lock, MA_OWNED);
5639786099deSNavdeep Parhar 	MPASS((cst->flags & (EO_FLOWC_PENDING | EO_FLOWC_RPL_PENDING)) ==
5640786099deSNavdeep Parhar 	    EO_FLOWC_PENDING);
5641786099deSNavdeep Parhar 
5642786099deSNavdeep Parhar 	flowc = start_wrq_wr(cst->eo_txq, ETID_FLOWC_LEN16, &cookie);
5643786099deSNavdeep Parhar 	if (__predict_false(flowc == NULL))
5644786099deSNavdeep Parhar 		return (ENOMEM);
5645786099deSNavdeep Parhar 
5646786099deSNavdeep Parhar 	bzero(flowc, ETID_FLOWC_LEN);
5647786099deSNavdeep Parhar 	flowc->op_to_nparams = htobe32(V_FW_WR_OP(FW_FLOWC_WR) |
5648786099deSNavdeep Parhar 	    V_FW_FLOWC_WR_NPARAMS(ETID_FLOWC_NPARAMS) | V_FW_WR_COMPL(0));
5649786099deSNavdeep Parhar 	flowc->flowid_len16 = htonl(V_FW_WR_LEN16(ETID_FLOWC_LEN16) |
5650786099deSNavdeep Parhar 	    V_FW_WR_FLOWID(cst->etid));
5651786099deSNavdeep Parhar 	flowc->mnemval[0].mnemonic = FW_FLOWC_MNEM_PFNVFN;
5652786099deSNavdeep Parhar 	flowc->mnemval[0].val = htobe32(pfvf);
5653786099deSNavdeep Parhar 	flowc->mnemval[1].mnemonic = FW_FLOWC_MNEM_CH;
5654786099deSNavdeep Parhar 	flowc->mnemval[1].val = htobe32(pi->tx_chan);
5655786099deSNavdeep Parhar 	flowc->mnemval[2].mnemonic = FW_FLOWC_MNEM_PORT;
5656786099deSNavdeep Parhar 	flowc->mnemval[2].val = htobe32(pi->tx_chan);
5657786099deSNavdeep Parhar 	flowc->mnemval[3].mnemonic = FW_FLOWC_MNEM_IQID;
5658786099deSNavdeep Parhar 	flowc->mnemval[3].val = htobe32(cst->iqid);
5659786099deSNavdeep Parhar 	flowc->mnemval[4].mnemonic = FW_FLOWC_MNEM_EOSTATE;
5660786099deSNavdeep Parhar 	flowc->mnemval[4].val = htobe32(FW_FLOWC_MNEM_EOSTATE_ESTABLISHED);
5661786099deSNavdeep Parhar 	flowc->mnemval[5].mnemonic = FW_FLOWC_MNEM_SCHEDCLASS;
5662786099deSNavdeep Parhar 	flowc->mnemval[5].val = htobe32(cst->schedcl);
5663786099deSNavdeep Parhar 
5664786099deSNavdeep Parhar 	commit_wrq_wr(cst->eo_txq, flowc, &cookie);
5665786099deSNavdeep Parhar 
5666786099deSNavdeep Parhar 	cst->flags &= ~EO_FLOWC_PENDING;
5667786099deSNavdeep Parhar 	cst->flags |= EO_FLOWC_RPL_PENDING;
5668786099deSNavdeep Parhar 	MPASS(cst->tx_credits >= ETID_FLOWC_LEN16);	/* flowc is first WR. */
5669786099deSNavdeep Parhar 	cst->tx_credits -= ETID_FLOWC_LEN16;
5670786099deSNavdeep Parhar 
5671786099deSNavdeep Parhar 	return (0);
5672786099deSNavdeep Parhar }
5673786099deSNavdeep Parhar 
5674786099deSNavdeep Parhar #define ETID_FLUSH_LEN16 (howmany(sizeof (struct fw_flowc_wr), 16))
5675786099deSNavdeep Parhar 
5676786099deSNavdeep Parhar void
5677786099deSNavdeep Parhar send_etid_flush_wr(struct cxgbe_snd_tag *cst)
5678786099deSNavdeep Parhar {
5679786099deSNavdeep Parhar 	struct fw_flowc_wr *flowc;
5680786099deSNavdeep Parhar 	struct wrq_cookie cookie;
5681786099deSNavdeep Parhar 
5682786099deSNavdeep Parhar 	mtx_assert(&cst->lock, MA_OWNED);
5683786099deSNavdeep Parhar 
5684786099deSNavdeep Parhar 	flowc = start_wrq_wr(cst->eo_txq, ETID_FLUSH_LEN16, &cookie);
5685786099deSNavdeep Parhar 	if (__predict_false(flowc == NULL))
5686786099deSNavdeep Parhar 		CXGBE_UNIMPLEMENTED(__func__);
5687786099deSNavdeep Parhar 
5688786099deSNavdeep Parhar 	bzero(flowc, ETID_FLUSH_LEN16 * 16);
5689786099deSNavdeep Parhar 	flowc->op_to_nparams = htobe32(V_FW_WR_OP(FW_FLOWC_WR) |
5690786099deSNavdeep Parhar 	    V_FW_FLOWC_WR_NPARAMS(0) | F_FW_WR_COMPL);
5691786099deSNavdeep Parhar 	flowc->flowid_len16 = htobe32(V_FW_WR_LEN16(ETID_FLUSH_LEN16) |
5692786099deSNavdeep Parhar 	    V_FW_WR_FLOWID(cst->etid));
5693786099deSNavdeep Parhar 
5694786099deSNavdeep Parhar 	commit_wrq_wr(cst->eo_txq, flowc, &cookie);
5695786099deSNavdeep Parhar 
5696786099deSNavdeep Parhar 	cst->flags |= EO_FLUSH_RPL_PENDING;
5697786099deSNavdeep Parhar 	MPASS(cst->tx_credits >= ETID_FLUSH_LEN16);
5698786099deSNavdeep Parhar 	cst->tx_credits -= ETID_FLUSH_LEN16;
5699786099deSNavdeep Parhar 	cst->ncompl++;
5700786099deSNavdeep Parhar }
5701786099deSNavdeep Parhar 
5702786099deSNavdeep Parhar static void
5703786099deSNavdeep Parhar write_ethofld_wr(struct cxgbe_snd_tag *cst, struct fw_eth_tx_eo_wr *wr,
5704786099deSNavdeep Parhar     struct mbuf *m0, int compl)
5705786099deSNavdeep Parhar {
5706786099deSNavdeep Parhar 	struct cpl_tx_pkt_core *cpl;
5707786099deSNavdeep Parhar 	uint64_t ctrl1;
5708786099deSNavdeep Parhar 	uint32_t ctrl;	/* used in many unrelated places */
5709786099deSNavdeep Parhar 	int len16, pktlen, nsegs, immhdrs;
5710786099deSNavdeep Parhar 	caddr_t dst;
5711786099deSNavdeep Parhar 	uintptr_t p;
5712786099deSNavdeep Parhar 	struct ulptx_sgl *usgl;
5713786099deSNavdeep Parhar 	struct sglist sg;
5714786099deSNavdeep Parhar 	struct sglist_seg segs[38];	/* XXX: find real limit.  XXX: get off the stack */
5715786099deSNavdeep Parhar 
5716786099deSNavdeep Parhar 	mtx_assert(&cst->lock, MA_OWNED);
5717786099deSNavdeep Parhar 	M_ASSERTPKTHDR(m0);
5718786099deSNavdeep Parhar 	KASSERT(m0->m_pkthdr.l2hlen > 0 && m0->m_pkthdr.l3hlen > 0 &&
5719786099deSNavdeep Parhar 	    m0->m_pkthdr.l4hlen > 0,
5720786099deSNavdeep Parhar 	    ("%s: ethofld mbuf %p is missing header lengths", __func__, m0));
5721786099deSNavdeep Parhar 
5722786099deSNavdeep Parhar 	len16 = mbuf_eo_len16(m0);
5723786099deSNavdeep Parhar 	nsegs = mbuf_eo_nsegs(m0);
5724786099deSNavdeep Parhar 	pktlen = m0->m_pkthdr.len;
5725786099deSNavdeep Parhar 	ctrl = sizeof(struct cpl_tx_pkt_core);
5726786099deSNavdeep Parhar 	if (needs_tso(m0))
5727786099deSNavdeep Parhar 		ctrl += sizeof(struct cpl_tx_pkt_lso_core);
5728786099deSNavdeep Parhar 	immhdrs = m0->m_pkthdr.l2hlen + m0->m_pkthdr.l3hlen + m0->m_pkthdr.l4hlen;
5729786099deSNavdeep Parhar 	ctrl += immhdrs;
5730786099deSNavdeep Parhar 
5731786099deSNavdeep Parhar 	wr->op_immdlen = htobe32(V_FW_WR_OP(FW_ETH_TX_EO_WR) |
5732786099deSNavdeep Parhar 	    V_FW_ETH_TX_EO_WR_IMMDLEN(ctrl) | V_FW_WR_COMPL(!!compl));
5733786099deSNavdeep Parhar 	wr->equiq_to_len16 = htobe32(V_FW_WR_LEN16(len16) |
5734786099deSNavdeep Parhar 	    V_FW_WR_FLOWID(cst->etid));
5735786099deSNavdeep Parhar 	wr->r3 = 0;
57366933902dSNavdeep Parhar 	if (needs_udp_csum(m0)) {
57376933902dSNavdeep Parhar 		wr->u.udpseg.type = FW_ETH_TX_EO_TYPE_UDPSEG;
57386933902dSNavdeep Parhar 		wr->u.udpseg.ethlen = m0->m_pkthdr.l2hlen;
57396933902dSNavdeep Parhar 		wr->u.udpseg.iplen = htobe16(m0->m_pkthdr.l3hlen);
57406933902dSNavdeep Parhar 		wr->u.udpseg.udplen = m0->m_pkthdr.l4hlen;
57416933902dSNavdeep Parhar 		wr->u.udpseg.rtplen = 0;
57426933902dSNavdeep Parhar 		wr->u.udpseg.r4 = 0;
57436933902dSNavdeep Parhar 		wr->u.udpseg.mss = htobe16(pktlen - immhdrs);
57446933902dSNavdeep Parhar 		wr->u.udpseg.schedpktsize = wr->u.udpseg.mss;
57456933902dSNavdeep Parhar 		wr->u.udpseg.plen = htobe32(pktlen - immhdrs);
57466933902dSNavdeep Parhar 		cpl = (void *)(wr + 1);
57476933902dSNavdeep Parhar 	} else {
57486933902dSNavdeep Parhar 		MPASS(needs_tcp_csum(m0));
5749786099deSNavdeep Parhar 		wr->u.tcpseg.type = FW_ETH_TX_EO_TYPE_TCPSEG;
5750786099deSNavdeep Parhar 		wr->u.tcpseg.ethlen = m0->m_pkthdr.l2hlen;
5751786099deSNavdeep Parhar 		wr->u.tcpseg.iplen = htobe16(m0->m_pkthdr.l3hlen);
5752786099deSNavdeep Parhar 		wr->u.tcpseg.tcplen = m0->m_pkthdr.l4hlen;
5753786099deSNavdeep Parhar 		wr->u.tcpseg.tsclk_tsoff = mbuf_eo_tsclk_tsoff(m0);
5754786099deSNavdeep Parhar 		wr->u.tcpseg.r4 = 0;
5755786099deSNavdeep Parhar 		wr->u.tcpseg.r5 = 0;
5756786099deSNavdeep Parhar 		wr->u.tcpseg.plen = htobe32(pktlen - immhdrs);
5757786099deSNavdeep Parhar 
5758786099deSNavdeep Parhar 		if (needs_tso(m0)) {
5759786099deSNavdeep Parhar 			struct cpl_tx_pkt_lso_core *lso = (void *)(wr + 1);
5760786099deSNavdeep Parhar 
5761786099deSNavdeep Parhar 			wr->u.tcpseg.mss = htobe16(m0->m_pkthdr.tso_segsz);
5762786099deSNavdeep Parhar 
57636933902dSNavdeep Parhar 			ctrl = V_LSO_OPCODE(CPL_TX_PKT_LSO) |
57646933902dSNavdeep Parhar 			    F_LSO_FIRST_SLICE | F_LSO_LAST_SLICE |
57656933902dSNavdeep Parhar 			    V_LSO_IPHDR_LEN(m0->m_pkthdr.l3hlen >> 2) |
57666933902dSNavdeep Parhar 			    V_LSO_TCPHDR_LEN(m0->m_pkthdr.l4hlen >> 2);
5767786099deSNavdeep Parhar 			if (m0->m_pkthdr.l2hlen == sizeof(struct ether_vlan_header))
5768786099deSNavdeep Parhar 				ctrl |= V_LSO_ETHHDR_LEN(1);
5769786099deSNavdeep Parhar 			if (m0->m_pkthdr.l3hlen == sizeof(struct ip6_hdr))
5770786099deSNavdeep Parhar 				ctrl |= F_LSO_IPV6;
5771786099deSNavdeep Parhar 			lso->lso_ctrl = htobe32(ctrl);
5772786099deSNavdeep Parhar 			lso->ipid_ofst = htobe16(0);
5773786099deSNavdeep Parhar 			lso->mss = htobe16(m0->m_pkthdr.tso_segsz);
5774786099deSNavdeep Parhar 			lso->seqno_offset = htobe32(0);
5775786099deSNavdeep Parhar 			lso->len = htobe32(pktlen);
5776786099deSNavdeep Parhar 
5777786099deSNavdeep Parhar 			cpl = (void *)(lso + 1);
5778786099deSNavdeep Parhar 		} else {
5779786099deSNavdeep Parhar 			wr->u.tcpseg.mss = htobe16(0xffff);
5780786099deSNavdeep Parhar 			cpl = (void *)(wr + 1);
5781786099deSNavdeep Parhar 		}
57826933902dSNavdeep Parhar 	}
5783786099deSNavdeep Parhar 
5784786099deSNavdeep Parhar 	/* Checksum offload must be requested for ethofld. */
5785786099deSNavdeep Parhar 	ctrl1 = 0;
5786786099deSNavdeep Parhar 	MPASS(needs_l4_csum(m0));
5787786099deSNavdeep Parhar 
5788786099deSNavdeep Parhar 	/* VLAN tag insertion */
5789786099deSNavdeep Parhar 	if (needs_vlan_insertion(m0)) {
5790786099deSNavdeep Parhar 		ctrl1 |= F_TXPKT_VLAN_VLD |
5791786099deSNavdeep Parhar 		    V_TXPKT_VLAN(m0->m_pkthdr.ether_vtag);
5792786099deSNavdeep Parhar 	}
5793786099deSNavdeep Parhar 
5794786099deSNavdeep Parhar 	/* CPL header */
5795786099deSNavdeep Parhar 	cpl->ctrl0 = cst->ctrl0;
5796786099deSNavdeep Parhar 	cpl->pack = 0;
5797786099deSNavdeep Parhar 	cpl->len = htobe16(pktlen);
5798786099deSNavdeep Parhar 	cpl->ctrl1 = htobe64(ctrl1);
5799786099deSNavdeep Parhar 
58006933902dSNavdeep Parhar 	/* Copy Ethernet, IP & TCP/UDP hdrs as immediate data */
5801786099deSNavdeep Parhar 	p = (uintptr_t)(cpl + 1);
5802786099deSNavdeep Parhar 	m_copydata(m0, 0, immhdrs, (void *)p);
5803786099deSNavdeep Parhar 
5804786099deSNavdeep Parhar 	/* SGL */
5805786099deSNavdeep Parhar 	dst = (void *)(cpl + 1);
5806786099deSNavdeep Parhar 	if (nsegs > 0) {
5807786099deSNavdeep Parhar 		int i, pad;
5808786099deSNavdeep Parhar 
5809786099deSNavdeep Parhar 		/* zero-pad upto next 16Byte boundary, if not 16Byte aligned */
5810786099deSNavdeep Parhar 		p += immhdrs;
5811786099deSNavdeep Parhar 		pad = 16 - (immhdrs & 0xf);
5812786099deSNavdeep Parhar 		bzero((void *)p, pad);
5813786099deSNavdeep Parhar 
5814786099deSNavdeep Parhar 		usgl = (void *)(p + pad);
5815786099deSNavdeep Parhar 		usgl->cmd_nsge = htobe32(V_ULPTX_CMD(ULP_TX_SC_DSGL) |
5816786099deSNavdeep Parhar 		    V_ULPTX_NSGE(nsegs));
5817786099deSNavdeep Parhar 
5818786099deSNavdeep Parhar 		sglist_init(&sg, nitems(segs), segs);
5819786099deSNavdeep Parhar 		for (; m0 != NULL; m0 = m0->m_next) {
5820786099deSNavdeep Parhar 			if (__predict_false(m0->m_len == 0))
5821786099deSNavdeep Parhar 				continue;
5822786099deSNavdeep Parhar 			if (immhdrs >= m0->m_len) {
5823786099deSNavdeep Parhar 				immhdrs -= m0->m_len;
5824786099deSNavdeep Parhar 				continue;
5825786099deSNavdeep Parhar 			}
5826786099deSNavdeep Parhar 
5827786099deSNavdeep Parhar 			sglist_append(&sg, mtod(m0, char *) + immhdrs,
5828786099deSNavdeep Parhar 			    m0->m_len - immhdrs);
5829786099deSNavdeep Parhar 			immhdrs = 0;
5830786099deSNavdeep Parhar 		}
5831786099deSNavdeep Parhar 		MPASS(sg.sg_nseg == nsegs);
5832786099deSNavdeep Parhar 
5833786099deSNavdeep Parhar 		/*
5834786099deSNavdeep Parhar 		 * Zero pad last 8B in case the WR doesn't end on a 16B
5835786099deSNavdeep Parhar 		 * boundary.
5836786099deSNavdeep Parhar 		 */
5837786099deSNavdeep Parhar 		*(uint64_t *)((char *)wr + len16 * 16 - 8) = 0;
5838786099deSNavdeep Parhar 
5839786099deSNavdeep Parhar 		usgl->len0 = htobe32(segs[0].ss_len);
5840786099deSNavdeep Parhar 		usgl->addr0 = htobe64(segs[0].ss_paddr);
5841786099deSNavdeep Parhar 		for (i = 0; i < nsegs - 1; i++) {
5842786099deSNavdeep Parhar 			usgl->sge[i / 2].len[i & 1] = htobe32(segs[i + 1].ss_len);
5843786099deSNavdeep Parhar 			usgl->sge[i / 2].addr[i & 1] = htobe64(segs[i + 1].ss_paddr);
5844786099deSNavdeep Parhar 		}
5845786099deSNavdeep Parhar 		if (i & 1)
5846786099deSNavdeep Parhar 			usgl->sge[i / 2].len[1] = htobe32(0);
5847786099deSNavdeep Parhar 	}
5848786099deSNavdeep Parhar 
5849786099deSNavdeep Parhar }
5850786099deSNavdeep Parhar 
5851786099deSNavdeep Parhar static void
5852786099deSNavdeep Parhar ethofld_tx(struct cxgbe_snd_tag *cst)
5853786099deSNavdeep Parhar {
5854786099deSNavdeep Parhar 	struct mbuf *m;
5855786099deSNavdeep Parhar 	struct wrq_cookie cookie;
5856786099deSNavdeep Parhar 	int next_credits, compl;
5857786099deSNavdeep Parhar 	struct fw_eth_tx_eo_wr *wr;
5858786099deSNavdeep Parhar 
5859786099deSNavdeep Parhar 	mtx_assert(&cst->lock, MA_OWNED);
5860786099deSNavdeep Parhar 
5861786099deSNavdeep Parhar 	while ((m = mbufq_first(&cst->pending_tx)) != NULL) {
5862786099deSNavdeep Parhar 		M_ASSERTPKTHDR(m);
5863786099deSNavdeep Parhar 
5864786099deSNavdeep Parhar 		/* How many len16 credits do we need to send this mbuf. */
5865786099deSNavdeep Parhar 		next_credits = mbuf_eo_len16(m);
5866786099deSNavdeep Parhar 		MPASS(next_credits > 0);
5867786099deSNavdeep Parhar 		if (next_credits > cst->tx_credits) {
5868786099deSNavdeep Parhar 			/*
5869786099deSNavdeep Parhar 			 * Tx will make progress eventually because there is at
5870786099deSNavdeep Parhar 			 * least one outstanding fw4_ack that will return
5871786099deSNavdeep Parhar 			 * credits and kick the tx.
5872786099deSNavdeep Parhar 			 */
5873786099deSNavdeep Parhar 			MPASS(cst->ncompl > 0);
5874786099deSNavdeep Parhar 			return;
5875786099deSNavdeep Parhar 		}
5876786099deSNavdeep Parhar 		wr = start_wrq_wr(cst->eo_txq, next_credits, &cookie);
5877786099deSNavdeep Parhar 		if (__predict_false(wr == NULL)) {
5878786099deSNavdeep Parhar 			/* XXX: wishful thinking, not a real assertion. */
5879786099deSNavdeep Parhar 			MPASS(cst->ncompl > 0);
5880786099deSNavdeep Parhar 			return;
5881786099deSNavdeep Parhar 		}
5882786099deSNavdeep Parhar 		cst->tx_credits -= next_credits;
5883786099deSNavdeep Parhar 		cst->tx_nocompl += next_credits;
5884786099deSNavdeep Parhar 		compl = cst->ncompl == 0 || cst->tx_nocompl >= cst->tx_total / 2;
5885786099deSNavdeep Parhar 		ETHER_BPF_MTAP(cst->com.ifp, m);
5886786099deSNavdeep Parhar 		write_ethofld_wr(cst, wr, m, compl);
5887786099deSNavdeep Parhar 		commit_wrq_wr(cst->eo_txq, wr, &cookie);
5888786099deSNavdeep Parhar 		if (compl) {
5889786099deSNavdeep Parhar 			cst->ncompl++;
5890786099deSNavdeep Parhar 			cst->tx_nocompl	= 0;
5891786099deSNavdeep Parhar 		}
5892786099deSNavdeep Parhar 		(void) mbufq_dequeue(&cst->pending_tx);
5893786099deSNavdeep Parhar 		mbufq_enqueue(&cst->pending_fwack, m);
5894786099deSNavdeep Parhar 	}
5895786099deSNavdeep Parhar }
5896786099deSNavdeep Parhar 
5897786099deSNavdeep Parhar int
5898786099deSNavdeep Parhar ethofld_transmit(struct ifnet *ifp, struct mbuf *m0)
5899786099deSNavdeep Parhar {
5900786099deSNavdeep Parhar 	struct cxgbe_snd_tag *cst;
5901786099deSNavdeep Parhar 	int rc;
5902786099deSNavdeep Parhar 
5903786099deSNavdeep Parhar 	MPASS(m0->m_nextpkt == NULL);
5904786099deSNavdeep Parhar 	MPASS(m0->m_pkthdr.snd_tag != NULL);
5905786099deSNavdeep Parhar 	cst = mst_to_cst(m0->m_pkthdr.snd_tag);
5906786099deSNavdeep Parhar 
5907786099deSNavdeep Parhar 	mtx_lock(&cst->lock);
5908786099deSNavdeep Parhar 	MPASS(cst->flags & EO_SND_TAG_REF);
5909786099deSNavdeep Parhar 
5910786099deSNavdeep Parhar 	if (__predict_false(cst->flags & EO_FLOWC_PENDING)) {
5911786099deSNavdeep Parhar 		struct vi_info *vi = ifp->if_softc;
5912786099deSNavdeep Parhar 		struct port_info *pi = vi->pi;
5913786099deSNavdeep Parhar 		struct adapter *sc = pi->adapter;
5914786099deSNavdeep Parhar 		const uint32_t rss_mask = vi->rss_size - 1;
5915786099deSNavdeep Parhar 		uint32_t rss_hash;
5916786099deSNavdeep Parhar 
5917786099deSNavdeep Parhar 		cst->eo_txq = &sc->sge.ofld_txq[vi->first_ofld_txq];
5918786099deSNavdeep Parhar 		if (M_HASHTYPE_ISHASH(m0))
5919786099deSNavdeep Parhar 			rss_hash = m0->m_pkthdr.flowid;
5920786099deSNavdeep Parhar 		else
5921786099deSNavdeep Parhar 			rss_hash = arc4random();
5922786099deSNavdeep Parhar 		/* We assume RSS hashing */
5923786099deSNavdeep Parhar 		cst->iqid = vi->rss[rss_hash & rss_mask];
5924786099deSNavdeep Parhar 		cst->eo_txq += rss_hash % vi->nofldtxq;
5925786099deSNavdeep Parhar 		rc = send_etid_flowc_wr(cst, pi, vi);
5926786099deSNavdeep Parhar 		if (rc != 0)
5927786099deSNavdeep Parhar 			goto done;
5928786099deSNavdeep Parhar 	}
5929786099deSNavdeep Parhar 
5930786099deSNavdeep Parhar 	if (__predict_false(cst->plen + m0->m_pkthdr.len > eo_max_backlog)) {
5931786099deSNavdeep Parhar 		rc = ENOBUFS;
5932786099deSNavdeep Parhar 		goto done;
5933786099deSNavdeep Parhar 	}
5934786099deSNavdeep Parhar 
5935786099deSNavdeep Parhar 	mbufq_enqueue(&cst->pending_tx, m0);
5936786099deSNavdeep Parhar 	cst->plen += m0->m_pkthdr.len;
5937786099deSNavdeep Parhar 
5938786099deSNavdeep Parhar 	ethofld_tx(cst);
5939786099deSNavdeep Parhar 	rc = 0;
5940786099deSNavdeep Parhar done:
5941786099deSNavdeep Parhar 	mtx_unlock(&cst->lock);
5942786099deSNavdeep Parhar 	if (__predict_false(rc != 0))
5943786099deSNavdeep Parhar 		m_freem(m0);
5944786099deSNavdeep Parhar 	return (rc);
5945786099deSNavdeep Parhar }
5946786099deSNavdeep Parhar 
5947786099deSNavdeep Parhar static int
5948786099deSNavdeep Parhar ethofld_fw4_ack(struct sge_iq *iq, const struct rss_header *rss, struct mbuf *m0)
5949786099deSNavdeep Parhar {
5950786099deSNavdeep Parhar 	struct adapter *sc = iq->adapter;
5951786099deSNavdeep Parhar 	const struct cpl_fw4_ack *cpl = (const void *)(rss + 1);
5952786099deSNavdeep Parhar 	struct mbuf *m;
5953786099deSNavdeep Parhar 	u_int etid = G_CPL_FW4_ACK_FLOWID(be32toh(OPCODE_TID(cpl)));
5954786099deSNavdeep Parhar 	struct cxgbe_snd_tag *cst;
5955786099deSNavdeep Parhar 	uint8_t credits = cpl->credits;
5956786099deSNavdeep Parhar 
5957786099deSNavdeep Parhar 	cst = lookup_etid(sc, etid);
5958786099deSNavdeep Parhar 	mtx_lock(&cst->lock);
5959786099deSNavdeep Parhar 	if (__predict_false(cst->flags & EO_FLOWC_RPL_PENDING)) {
5960786099deSNavdeep Parhar 		MPASS(credits >= ETID_FLOWC_LEN16);
5961786099deSNavdeep Parhar 		credits -= ETID_FLOWC_LEN16;
5962786099deSNavdeep Parhar 		cst->flags &= ~EO_FLOWC_RPL_PENDING;
5963786099deSNavdeep Parhar 	}
5964786099deSNavdeep Parhar 
5965786099deSNavdeep Parhar 	KASSERT(cst->ncompl > 0,
5966786099deSNavdeep Parhar 	    ("%s: etid %u (%p) wasn't expecting completion.",
5967786099deSNavdeep Parhar 	    __func__, etid, cst));
5968786099deSNavdeep Parhar 	cst->ncompl--;
5969786099deSNavdeep Parhar 
5970786099deSNavdeep Parhar 	while (credits > 0) {
5971786099deSNavdeep Parhar 		m = mbufq_dequeue(&cst->pending_fwack);
5972786099deSNavdeep Parhar 		if (__predict_false(m == NULL)) {
5973786099deSNavdeep Parhar 			/*
5974786099deSNavdeep Parhar 			 * The remaining credits are for the final flush that
5975786099deSNavdeep Parhar 			 * was issued when the tag was freed by the kernel.
5976786099deSNavdeep Parhar 			 */
5977786099deSNavdeep Parhar 			MPASS((cst->flags &
5978786099deSNavdeep Parhar 			    (EO_FLUSH_RPL_PENDING | EO_SND_TAG_REF)) ==
5979786099deSNavdeep Parhar 			    EO_FLUSH_RPL_PENDING);
5980786099deSNavdeep Parhar 			MPASS(credits == ETID_FLUSH_LEN16);
5981786099deSNavdeep Parhar 			MPASS(cst->tx_credits + cpl->credits == cst->tx_total);
5982786099deSNavdeep Parhar 			MPASS(cst->ncompl == 0);
5983786099deSNavdeep Parhar 
5984786099deSNavdeep Parhar 			cst->flags &= ~EO_FLUSH_RPL_PENDING;
5985786099deSNavdeep Parhar 			cst->tx_credits += cpl->credits;
5986786099deSNavdeep Parhar freetag:
5987786099deSNavdeep Parhar 			cxgbe_snd_tag_free_locked(cst);
5988786099deSNavdeep Parhar 			return (0);	/* cst is gone. */
5989786099deSNavdeep Parhar 		}
5990786099deSNavdeep Parhar 		KASSERT(m != NULL,
5991786099deSNavdeep Parhar 		    ("%s: too many credits (%u, %u)", __func__, cpl->credits,
5992786099deSNavdeep Parhar 		    credits));
5993786099deSNavdeep Parhar 		KASSERT(credits >= mbuf_eo_len16(m),
5994786099deSNavdeep Parhar 		    ("%s: too few credits (%u, %u, %u)", __func__,
5995786099deSNavdeep Parhar 		    cpl->credits, credits, mbuf_eo_len16(m)));
5996786099deSNavdeep Parhar 		credits -= mbuf_eo_len16(m);
5997786099deSNavdeep Parhar 		cst->plen -= m->m_pkthdr.len;
5998786099deSNavdeep Parhar 		m_freem(m);
5999786099deSNavdeep Parhar 	}
6000786099deSNavdeep Parhar 
6001786099deSNavdeep Parhar 	cst->tx_credits += cpl->credits;
6002786099deSNavdeep Parhar 	MPASS(cst->tx_credits <= cst->tx_total);
6003786099deSNavdeep Parhar 
6004786099deSNavdeep Parhar 	m = mbufq_first(&cst->pending_tx);
6005786099deSNavdeep Parhar 	if (m != NULL && cst->tx_credits >= mbuf_eo_len16(m))
6006786099deSNavdeep Parhar 		ethofld_tx(cst);
6007786099deSNavdeep Parhar 
6008786099deSNavdeep Parhar 	if (__predict_false((cst->flags & EO_SND_TAG_REF) == 0) &&
6009786099deSNavdeep Parhar 	    cst->ncompl == 0) {
6010786099deSNavdeep Parhar 		if (cst->tx_credits == cst->tx_total)
6011786099deSNavdeep Parhar 			goto freetag;
6012786099deSNavdeep Parhar 		else {
6013786099deSNavdeep Parhar 			MPASS((cst->flags & EO_FLUSH_RPL_PENDING) == 0);
6014786099deSNavdeep Parhar 			send_etid_flush_wr(cst);
6015786099deSNavdeep Parhar 		}
6016786099deSNavdeep Parhar 	}
6017786099deSNavdeep Parhar 
6018786099deSNavdeep Parhar 	mtx_unlock(&cst->lock);
6019786099deSNavdeep Parhar 
6020786099deSNavdeep Parhar 	return (0);
6021786099deSNavdeep Parhar }
6022786099deSNavdeep Parhar #endif
6023