xref: /linux/drivers/net/ethernet/sfc/ef100_tx.c (revision f84754dbc55e3abd8241e3038b615af65c745f47)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /****************************************************************************
3  * Driver for Solarflare network controllers and boards
4  * Copyright 2018 Solarflare Communications Inc.
5  * Copyright 2019-2020 Xilinx Inc.
6  *
7  * This program is free software; you can redistribute it and/or modify it
8  * under the terms of the GNU General Public License version 2 as published
9  * by the Free Software Foundation, incorporated herein by reference.
10  */
11 
12 #include <net/ip6_checksum.h>
13 
14 #include "net_driver.h"
15 #include "tx_common.h"
16 #include "nic_common.h"
17 #include "mcdi_functions.h"
18 #include "ef100_regs.h"
19 #include "io.h"
20 #include "ef100_tx.h"
21 #include "ef100_nic.h"
22 
23 int ef100_tx_probe(struct efx_tx_queue *tx_queue)
24 {
25 	/* Allocate an extra descriptor for the QMDA status completion entry */
26 	return efx_nic_alloc_buffer(tx_queue->efx, &tx_queue->txd.buf,
27 				    (tx_queue->ptr_mask + 2) *
28 				    sizeof(efx_oword_t),
29 				    GFP_KERNEL);
30 }
31 
32 void ef100_tx_init(struct efx_tx_queue *tx_queue)
33 {
34 	/* must be the inverse of lookup in efx_get_tx_channel */
35 	tx_queue->core_txq =
36 		netdev_get_tx_queue(tx_queue->efx->net_dev,
37 				    tx_queue->channel->channel -
38 				    tx_queue->efx->tx_channel_offset);
39 
40 	/* This value is purely documentational; as EF100 never passes through
41 	 * the switch statement in tx.c:__efx_enqueue_skb(), that switch does
42 	 * not handle case 3.  EF100's TSOv3 descriptors are generated by
43 	 * ef100_make_tso_desc().
44 	 * Meanwhile, all efx_mcdi_tx_init() cares about is that it's not 2.
45 	 */
46 	tx_queue->tso_version = 3;
47 	if (efx_mcdi_tx_init(tx_queue))
48 		netdev_WARN(tx_queue->efx->net_dev,
49 			    "failed to initialise TXQ %d\n", tx_queue->queue);
50 }
51 
52 static bool ef100_tx_can_tso(struct efx_tx_queue *tx_queue, struct sk_buff *skb)
53 {
54 	struct efx_nic *efx = tx_queue->efx;
55 	struct ef100_nic_data *nic_data;
56 	struct efx_tx_buffer *buffer;
57 	size_t header_len;
58 	u32 mss;
59 
60 	nic_data = efx->nic_data;
61 
62 	if (!skb_is_gso_tcp(skb))
63 		return false;
64 	if (!(efx->net_dev->features & NETIF_F_TSO))
65 		return false;
66 
67 	mss = skb_shinfo(skb)->gso_size;
68 	if (unlikely(mss < 4)) {
69 		WARN_ONCE(1, "MSS of %u is too small for TSO\n", mss);
70 		return false;
71 	}
72 
73 	header_len = efx_tx_tso_header_length(skb);
74 	if (header_len > nic_data->tso_max_hdr_len)
75 		return false;
76 
77 	if (skb_shinfo(skb)->gso_segs > nic_data->tso_max_payload_num_segs) {
78 		/* net_dev->gso_max_segs should've caught this */
79 		WARN_ON_ONCE(1);
80 		return false;
81 	}
82 
83 	if (skb->data_len / mss > nic_data->tso_max_frames)
84 		return false;
85 
86 	/* net_dev->gso_max_size should've caught this */
87 	if (WARN_ON_ONCE(skb->data_len > nic_data->tso_max_payload_len))
88 		return false;
89 
90 	/* Reserve an empty buffer for the TSO V3 descriptor.
91 	 * Convey the length of the header since we already know it.
92 	 */
93 	buffer = efx_tx_queue_get_insert_buffer(tx_queue);
94 	buffer->flags = EFX_TX_BUF_TSO_V3 | EFX_TX_BUF_CONT;
95 	buffer->len = header_len;
96 	buffer->unmap_len = 0;
97 	buffer->skb = skb;
98 	++tx_queue->insert_count;
99 	return true;
100 }
101 
102 static efx_oword_t *ef100_tx_desc(struct efx_tx_queue *tx_queue, unsigned int index)
103 {
104 	if (likely(tx_queue->txd.buf.addr))
105 		return ((efx_oword_t *)tx_queue->txd.buf.addr) + index;
106 	else
107 		return NULL;
108 }
109 
110 static void ef100_notify_tx_desc(struct efx_tx_queue *tx_queue)
111 {
112 	unsigned int write_ptr;
113 	efx_dword_t reg;
114 
115 	tx_queue->xmit_pending = false;
116 
117 	if (unlikely(tx_queue->notify_count == tx_queue->write_count))
118 		return;
119 
120 	write_ptr = tx_queue->write_count & tx_queue->ptr_mask;
121 	/* The write pointer goes into the high word */
122 	EFX_POPULATE_DWORD_1(reg, ERF_GZ_TX_RING_PIDX, write_ptr);
123 	efx_writed_page(tx_queue->efx, &reg,
124 			ER_GZ_TX_RING_DOORBELL, tx_queue->queue);
125 	tx_queue->notify_count = tx_queue->write_count;
126 }
127 
128 static void ef100_tx_push_buffers(struct efx_tx_queue *tx_queue)
129 {
130 	ef100_notify_tx_desc(tx_queue);
131 	++tx_queue->pushes;
132 }
133 
134 static void ef100_set_tx_csum_partial(const struct sk_buff *skb,
135 				      struct efx_tx_buffer *buffer, efx_oword_t *txd)
136 {
137 	efx_oword_t csum;
138 	int csum_start;
139 
140 	if (!skb || skb->ip_summed != CHECKSUM_PARTIAL)
141 		return;
142 
143 	/* skb->csum_start has the offset from head, but we need the offset
144 	 * from data.
145 	 */
146 	csum_start = skb_checksum_start_offset(skb);
147 	EFX_POPULATE_OWORD_3(csum,
148 			     ESF_GZ_TX_SEND_CSO_PARTIAL_EN, 1,
149 			     ESF_GZ_TX_SEND_CSO_PARTIAL_START_W,
150 			     csum_start >> 1,
151 			     ESF_GZ_TX_SEND_CSO_PARTIAL_CSUM_W,
152 			     skb->csum_offset >> 1);
153 	EFX_OR_OWORD(*txd, *txd, csum);
154 }
155 
156 static void ef100_set_tx_hw_vlan(const struct sk_buff *skb, efx_oword_t *txd)
157 {
158 	u16 vlan_tci = skb_vlan_tag_get(skb);
159 	efx_oword_t vlan;
160 
161 	EFX_POPULATE_OWORD_2(vlan,
162 			     ESF_GZ_TX_SEND_VLAN_INSERT_EN, 1,
163 			     ESF_GZ_TX_SEND_VLAN_INSERT_TCI, vlan_tci);
164 	EFX_OR_OWORD(*txd, *txd, vlan);
165 }
166 
167 static void ef100_make_send_desc(struct efx_nic *efx,
168 				 const struct sk_buff *skb,
169 				 struct efx_tx_buffer *buffer, efx_oword_t *txd,
170 				 unsigned int segment_count)
171 {
172 	/* TX send descriptor */
173 	EFX_POPULATE_OWORD_3(*txd,
174 			     ESF_GZ_TX_SEND_NUM_SEGS, segment_count,
175 			     ESF_GZ_TX_SEND_LEN, buffer->len,
176 			     ESF_GZ_TX_SEND_ADDR, buffer->dma_addr);
177 
178 	if (likely(efx->net_dev->features & NETIF_F_HW_CSUM))
179 		ef100_set_tx_csum_partial(skb, buffer, txd);
180 	if (efx->net_dev->features & NETIF_F_HW_VLAN_CTAG_TX &&
181 	    skb && skb_vlan_tag_present(skb))
182 		ef100_set_tx_hw_vlan(skb, txd);
183 }
184 
185 static void ef100_make_tso_desc(struct efx_nic *efx,
186 				const struct sk_buff *skb,
187 				struct efx_tx_buffer *buffer, efx_oword_t *txd,
188 				unsigned int segment_count)
189 {
190 	bool gso_partial = skb_shinfo(skb)->gso_type & SKB_GSO_PARTIAL;
191 	unsigned int len, ip_offset, tcp_offset, payload_segs;
192 	u32 mangleid = ESE_GZ_TX_DESC_IP4_ID_INC_MOD16;
193 	unsigned int outer_ip_offset, outer_l4_offset;
194 	u16 vlan_tci = skb_vlan_tag_get(skb);
195 	u32 mss = skb_shinfo(skb)->gso_size;
196 	bool encap = skb->encapsulation;
197 	u16 vlan_enable = 0;
198 	struct tcphdr *tcp;
199 	u32 paylen;
200 
201 	if (skb_shinfo(skb)->gso_type & SKB_GSO_TCP_FIXEDID)
202 		mangleid = ESE_GZ_TX_DESC_IP4_ID_NO_OP;
203 	if (efx->net_dev->features & NETIF_F_HW_VLAN_CTAG_TX)
204 		vlan_enable = skb_vlan_tag_present(skb);
205 
206 	len = skb->len - buffer->len;
207 	/* We use 1 for the TSO descriptor and 1 for the header */
208 	payload_segs = segment_count - 2;
209 	if (encap) {
210 		outer_ip_offset = skb_network_offset(skb);
211 		outer_l4_offset = skb_transport_offset(skb);
212 		ip_offset = skb_inner_network_offset(skb);
213 		tcp_offset = skb_inner_transport_offset(skb);
214 	} else {
215 		ip_offset =  skb_network_offset(skb);
216 		tcp_offset = skb_transport_offset(skb);
217 		outer_ip_offset = outer_l4_offset = 0;
218 	}
219 
220 	/* subtract TCP payload length from inner checksum */
221 	tcp = (void *)skb->data + tcp_offset;
222 	paylen = skb->len - tcp_offset;
223 	csum_replace_by_diff(&tcp->check, (__force __wsum)htonl(paylen));
224 
225 	EFX_POPULATE_OWORD_17(*txd,
226 			      ESF_GZ_TX_DESC_TYPE, ESE_GZ_TX_DESC_TYPE_TSO,
227 			      ESF_GZ_TX_TSO_MSS, mss,
228 			      ESF_GZ_TX_TSO_HDR_NUM_SEGS, 1,
229 			      ESF_GZ_TX_TSO_PAYLOAD_NUM_SEGS, payload_segs,
230 			      ESF_GZ_TX_TSO_HDR_LEN_W, buffer->len >> 1,
231 			      ESF_GZ_TX_TSO_PAYLOAD_LEN, len,
232 			      ESF_GZ_TX_TSO_CSO_INNER_L4, 1,
233 			      ESF_GZ_TX_TSO_INNER_L3_OFF_W, ip_offset >> 1,
234 			      ESF_GZ_TX_TSO_INNER_L4_OFF_W, tcp_offset >> 1,
235 			      ESF_GZ_TX_TSO_ED_INNER_IP4_ID, mangleid,
236 			      ESF_GZ_TX_TSO_ED_INNER_IP_LEN, 1,
237 			      ESF_GZ_TX_TSO_OUTER_L3_OFF_W, outer_ip_offset >> 1,
238 			      ESF_GZ_TX_TSO_OUTER_L4_OFF_W, outer_l4_offset >> 1,
239 			      ESF_GZ_TX_TSO_ED_OUTER_UDP_LEN, encap && !gso_partial,
240 			      ESF_GZ_TX_TSO_ED_OUTER_IP4_ID, encap ? mangleid :
241 								     ESE_GZ_TX_DESC_IP4_ID_NO_OP,
242 			      ESF_GZ_TX_TSO_VLAN_INSERT_EN, vlan_enable,
243 			      ESF_GZ_TX_TSO_VLAN_INSERT_TCI, vlan_tci
244 		);
245 }
246 
247 static void ef100_tx_make_descriptors(struct efx_tx_queue *tx_queue,
248 				      const struct sk_buff *skb,
249 				      unsigned int segment_count)
250 {
251 	unsigned int old_write_count = tx_queue->write_count;
252 	unsigned int new_write_count = old_write_count;
253 	struct efx_tx_buffer *buffer;
254 	unsigned int next_desc_type;
255 	unsigned int write_ptr;
256 	efx_oword_t *txd;
257 	unsigned int nr_descs = tx_queue->insert_count - old_write_count;
258 
259 	if (unlikely(nr_descs == 0))
260 		return;
261 
262 	if (segment_count)
263 		next_desc_type = ESE_GZ_TX_DESC_TYPE_TSO;
264 	else
265 		next_desc_type = ESE_GZ_TX_DESC_TYPE_SEND;
266 
267 	/* if it's a raw write (such as XDP) then always SEND single frames */
268 	if (!skb)
269 		nr_descs = 1;
270 
271 	do {
272 		write_ptr = new_write_count & tx_queue->ptr_mask;
273 		buffer = &tx_queue->buffer[write_ptr];
274 		txd = ef100_tx_desc(tx_queue, write_ptr);
275 		++new_write_count;
276 
277 		/* Create TX descriptor ring entry */
278 		tx_queue->packet_write_count = new_write_count;
279 
280 		switch (next_desc_type) {
281 		case ESE_GZ_TX_DESC_TYPE_SEND:
282 			ef100_make_send_desc(tx_queue->efx, skb,
283 					     buffer, txd, nr_descs);
284 			break;
285 		case ESE_GZ_TX_DESC_TYPE_TSO:
286 			/* TX TSO descriptor */
287 			WARN_ON_ONCE(!(buffer->flags & EFX_TX_BUF_TSO_V3));
288 			ef100_make_tso_desc(tx_queue->efx, skb,
289 					    buffer, txd, nr_descs);
290 			break;
291 		default:
292 			/* TX segment descriptor */
293 			EFX_POPULATE_OWORD_3(*txd,
294 					     ESF_GZ_TX_DESC_TYPE, ESE_GZ_TX_DESC_TYPE_SEG,
295 					     ESF_GZ_TX_SEG_LEN, buffer->len,
296 					     ESF_GZ_TX_SEG_ADDR, buffer->dma_addr);
297 		}
298 		/* if it's a raw write (such as XDP) then always SEND */
299 		next_desc_type = skb ? ESE_GZ_TX_DESC_TYPE_SEG :
300 				       ESE_GZ_TX_DESC_TYPE_SEND;
301 
302 	} while (new_write_count != tx_queue->insert_count);
303 
304 	wmb(); /* Ensure descriptors are written before they are fetched */
305 
306 	tx_queue->write_count = new_write_count;
307 
308 	/* The write_count above must be updated before reading
309 	 * channel->holdoff_doorbell to avoid a race with the
310 	 * completion path, so ensure these operations are not
311 	 * re-ordered.  This also flushes the update of write_count
312 	 * back into the cache.
313 	 */
314 	smp_mb();
315 }
316 
317 void ef100_tx_write(struct efx_tx_queue *tx_queue)
318 {
319 	ef100_tx_make_descriptors(tx_queue, NULL, 0);
320 	ef100_tx_push_buffers(tx_queue);
321 }
322 
323 void ef100_ev_tx(struct efx_channel *channel, const efx_qword_t *p_event)
324 {
325 	unsigned int tx_done =
326 		EFX_QWORD_FIELD(*p_event, ESF_GZ_EV_TXCMPL_NUM_DESC);
327 	unsigned int qlabel =
328 		EFX_QWORD_FIELD(*p_event, ESF_GZ_EV_TXCMPL_Q_LABEL);
329 	struct efx_tx_queue *tx_queue =
330 		efx_channel_get_tx_queue(channel, qlabel);
331 	unsigned int tx_index = (tx_queue->read_count + tx_done - 1) &
332 				tx_queue->ptr_mask;
333 
334 	efx_xmit_done(tx_queue, tx_index);
335 }
336 
337 /* Add a socket buffer to a TX queue
338  *
339  * You must hold netif_tx_lock() to call this function.
340  *
341  * Returns 0 on success, error code otherwise. In case of an error this
342  * function will free the SKB.
343  */
344 int ef100_enqueue_skb(struct efx_tx_queue *tx_queue, struct sk_buff *skb)
345 {
346 	unsigned int old_insert_count = tx_queue->insert_count;
347 	struct efx_nic *efx = tx_queue->efx;
348 	bool xmit_more = netdev_xmit_more();
349 	unsigned int fill_level;
350 	unsigned int segments;
351 	int rc;
352 
353 	if (!tx_queue->buffer || !tx_queue->ptr_mask) {
354 		netif_stop_queue(efx->net_dev);
355 		dev_kfree_skb_any(skb);
356 		return -ENODEV;
357 	}
358 
359 	segments = skb_is_gso(skb) ? skb_shinfo(skb)->gso_segs : 0;
360 	if (segments == 1)
361 		segments = 0;	/* Don't use TSO/GSO for a single segment. */
362 	if (segments && !ef100_tx_can_tso(tx_queue, skb)) {
363 		rc = efx_tx_tso_fallback(tx_queue, skb);
364 		tx_queue->tso_fallbacks++;
365 		if (rc)
366 			goto err;
367 		else
368 			return 0;
369 	}
370 
371 	/* Map for DMA and create descriptors */
372 	rc = efx_tx_map_data(tx_queue, skb, segments);
373 	if (rc)
374 		goto err;
375 	ef100_tx_make_descriptors(tx_queue, skb, segments);
376 
377 	fill_level = efx_channel_tx_old_fill_level(tx_queue->channel);
378 	if (fill_level > efx->txq_stop_thresh) {
379 		struct efx_tx_queue *txq2;
380 
381 		netif_tx_stop_queue(tx_queue->core_txq);
382 		/* Re-read after a memory barrier in case we've raced with
383 		 * the completion path. Otherwise there's a danger we'll never
384 		 * restart the queue if all completions have just happened.
385 		 */
386 		smp_mb();
387 		efx_for_each_channel_tx_queue(txq2, tx_queue->channel)
388 			txq2->old_read_count = READ_ONCE(txq2->read_count);
389 		fill_level = efx_channel_tx_old_fill_level(tx_queue->channel);
390 		if (fill_level < efx->txq_stop_thresh)
391 			netif_tx_start_queue(tx_queue->core_txq);
392 	}
393 
394 	tx_queue->xmit_pending = true;
395 
396 	/* If xmit_more then we don't need to push the doorbell, unless there
397 	 * are 256 descriptors already queued in which case we have to push to
398 	 * ensure we never push more than 256 at once.
399 	 */
400 	if (__netdev_tx_sent_queue(tx_queue->core_txq, skb->len, xmit_more) ||
401 	    tx_queue->write_count - tx_queue->notify_count > 255)
402 		ef100_tx_push_buffers(tx_queue);
403 
404 	if (segments) {
405 		tx_queue->tso_bursts++;
406 		tx_queue->tso_packets += segments;
407 		tx_queue->tx_packets  += segments;
408 	} else {
409 		tx_queue->tx_packets++;
410 	}
411 	return 0;
412 
413 err:
414 	efx_enqueue_unwind(tx_queue, old_insert_count);
415 	if (!IS_ERR_OR_NULL(skb))
416 		dev_kfree_skb_any(skb);
417 
418 	/* If we're not expecting another transmit and we had something to push
419 	 * on this queue then we need to push here to get the previous packets
420 	 * out.  We only enter this branch from before the xmit_more handling
421 	 * above, so xmit_pending still refers to the old state.
422 	 */
423 	if (tx_queue->xmit_pending && !xmit_more)
424 		ef100_tx_push_buffers(tx_queue);
425 	return rc;
426 }
427