1 /*
2 * Copyright (c) 2016, Mellanox Technologies. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
13 *
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
17 *
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 */
32
33 #include <linux/dim.h>
34 #include <linux/debugfs.h>
35 #include <linux/mlx5/fs.h>
36 #include <net/switchdev.h>
37 #include <net/pkt_cls.h>
38 #include <net/act_api.h>
39 #include <net/devlink.h>
40 #include <net/ipv6_stubs.h>
41
42 #include "eswitch.h"
43 #include "en.h"
44 #include "en/dim.h"
45 #include "en_rep.h"
46 #include "en/params.h"
47 #include "en/txrx.h"
48 #include "en_tc.h"
49 #include "en/rep/tc.h"
50 #include "en/rep/neigh.h"
51 #include "en/rep/bridge.h"
52 #include "en/devlink.h"
53 #include "fs_core.h"
54 #include "lib/mlx5.h"
55 #include "lib/devcom.h"
56 #include "lib/vxlan.h"
57 #define CREATE_TRACE_POINTS
58 #include "diag/en_rep_tracepoint.h"
59 #include "diag/reporter_vnic.h"
60 #include "en_accel/ipsec.h"
61 #include "en/tc/int_port.h"
62 #include "en/ptp.h"
63 #include "en/fs_ethtool.h"
64
/* Log2 SQ size that mlx5e_build_rep_params() applies to non-uplink
 * representors: 0x7, or the driver minimum if that is larger.
 */
#define MLX5E_REP_PARAMS_DEF_LOG_SQ_SIZE \
	max(0x7, MLX5E_PARAMS_MINIMUM_LOG_SQ_SIZE)
/* Channel count that mlx5e_build_rep_params() assigns to a representor. */
#define MLX5E_REP_PARAMS_DEF_NUM_CHANNELS 1

/* Driver name reported by the representor's ethtool get_drvinfo callback. */
static const char mlx5e_rep_driver_name[] = "mlx5e_rep";
70
mlx5e_rep_get_drvinfo(struct net_device * dev,struct ethtool_drvinfo * drvinfo)71 static void mlx5e_rep_get_drvinfo(struct net_device *dev,
72 struct ethtool_drvinfo *drvinfo)
73 {
74 struct mlx5e_priv *priv = netdev_priv(dev);
75 struct mlx5_core_dev *mdev = priv->mdev;
76 int count;
77
78 strscpy(drvinfo->driver, mlx5e_rep_driver_name,
79 sizeof(drvinfo->driver));
80 count = snprintf(drvinfo->fw_version, sizeof(drvinfo->fw_version),
81 "%d.%d.%04d (%.16s)", fw_rev_maj(mdev),
82 fw_rev_min(mdev), fw_rev_sub(mdev), mdev->board_id);
83 if (count >= sizeof(drvinfo->fw_version))
84 snprintf(drvinfo->fw_version, sizeof(drvinfo->fw_version),
85 "%d.%d.%04d", fw_rev_maj(mdev),
86 fw_rev_min(mdev), fw_rev_sub(mdev));
87 }
88
/* Software counters of the "sw_rep" stats group, read from
 * struct mlx5e_sw_stats.
 */
static const struct counter_desc sw_rep_stats_desc[] = {
	{ MLX5E_DECLARE_STAT(struct mlx5e_sw_stats, rx_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_sw_stats, rx_bytes) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_sw_stats, tx_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_sw_stats, tx_bytes) },
};
95
/* Vport counters of the "vport_rep" stats group, read from
 * struct mlx5e_rep_stats: the overall rx/tx totals followed by the
 * RDMA unicast and multicast breakdown.
 */
static const struct counter_desc vport_rep_stats_desc[] = {
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats, vport_rx_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats, vport_rx_bytes) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats, vport_tx_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats, vport_tx_bytes) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     rx_vport_rdma_unicast_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats, rx_vport_rdma_unicast_bytes) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     tx_vport_rdma_unicast_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats, tx_vport_rdma_unicast_bytes) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     rx_vport_rdma_multicast_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     rx_vport_rdma_multicast_bytes) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     tx_vport_rdma_multicast_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     tx_vport_rdma_multicast_bytes) },
};
116
/* Local loopback counters; the vport_rep group appends them to its regular
 * counters only when the device reports the vport_counter_local_loopback
 * capability.
 */
static const struct counter_desc vport_rep_loopback_stats_desc[] = {
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     vport_loopback_packets) },
	{ MLX5E_DECLARE_STAT(struct mlx5e_rep_stats,
			     vport_loopback_bytes) },
};
123
/* Entry counts of the descriptor tables above. */
#define NUM_VPORT_REP_SW_COUNTERS ARRAY_SIZE(sw_rep_stats_desc)
#define NUM_VPORT_REP_HW_COUNTERS ARRAY_SIZE(vport_rep_stats_desc)
/* Evaluates to 0 when @dev lacks the vport_counter_local_loopback capability. */
#define NUM_VPORT_REP_LOOPBACK_COUNTERS(dev) \
	(MLX5_CAP_GEN(dev, vport_counter_local_loopback) ? \
	 ARRAY_SIZE(vport_rep_loopback_stats_desc) : 0)
129
MLX5E_DECLARE_STATS_GRP_OP_NUM_STATS(sw_rep)130 static MLX5E_DECLARE_STATS_GRP_OP_NUM_STATS(sw_rep)
131 {
132 return NUM_VPORT_REP_SW_COUNTERS;
133 }
134
MLX5E_DECLARE_STATS_GRP_OP_FILL_STRS(sw_rep)135 static MLX5E_DECLARE_STATS_GRP_OP_FILL_STRS(sw_rep)
136 {
137 int i;
138
139 for (i = 0; i < NUM_VPORT_REP_SW_COUNTERS; i++)
140 ethtool_puts(data, sw_rep_stats_desc[i].format);
141 }
142
MLX5E_DECLARE_STATS_GRP_OP_FILL_STATS(sw_rep)143 static MLX5E_DECLARE_STATS_GRP_OP_FILL_STATS(sw_rep)
144 {
145 int i;
146
147 for (i = 0; i < NUM_VPORT_REP_SW_COUNTERS; i++)
148 mlx5e_ethtool_put_stat(
149 data, MLX5E_READ_CTR64_CPU(&priv->stats.sw,
150 sw_rep_stats_desc, i));
151 }
152
MLX5E_DECLARE_STATS_GRP_OP_UPDATE_STATS(sw_rep)153 static MLX5E_DECLARE_STATS_GRP_OP_UPDATE_STATS(sw_rep)
154 {
155 struct mlx5e_sw_stats *s = &priv->stats.sw;
156 struct rtnl_link_stats64 stats64 = {};
157
158 memset(s, 0, sizeof(*s));
159 mlx5e_fold_sw_stats64(priv, &stats64);
160
161 s->rx_packets = stats64.rx_packets;
162 s->rx_bytes = stats64.rx_bytes;
163 s->tx_packets = stats64.tx_packets;
164 s->tx_bytes = stats64.tx_bytes;
165 s->tx_queue_dropped = stats64.tx_dropped;
166 }
167
MLX5E_DECLARE_STATS_GRP_OP_NUM_STATS(vport_rep)168 static MLX5E_DECLARE_STATS_GRP_OP_NUM_STATS(vport_rep)
169 {
170 return NUM_VPORT_REP_HW_COUNTERS +
171 NUM_VPORT_REP_LOOPBACK_COUNTERS(priv->mdev);
172 }
173
MLX5E_DECLARE_STATS_GRP_OP_FILL_STRS(vport_rep)174 static MLX5E_DECLARE_STATS_GRP_OP_FILL_STRS(vport_rep)
175 {
176 int i;
177
178 for (i = 0; i < NUM_VPORT_REP_HW_COUNTERS; i++)
179 ethtool_puts(data, vport_rep_stats_desc[i].format);
180 for (i = 0; i < NUM_VPORT_REP_LOOPBACK_COUNTERS(priv->mdev); i++)
181 ethtool_puts(data, vport_rep_loopback_stats_desc[i].format);
182 }
183
MLX5E_DECLARE_STATS_GRP_OP_FILL_STATS(vport_rep)184 static MLX5E_DECLARE_STATS_GRP_OP_FILL_STATS(vport_rep)
185 {
186 int i;
187
188 for (i = 0; i < NUM_VPORT_REP_HW_COUNTERS; i++)
189 mlx5e_ethtool_put_stat(
190 data, MLX5E_READ_CTR64_CPU(&priv->stats.rep_stats,
191 vport_rep_stats_desc, i));
192 for (i = 0; i < NUM_VPORT_REP_LOOPBACK_COUNTERS(priv->mdev); i++)
193 mlx5e_ethtool_put_stat(
194 data,
195 MLX5E_READ_CTR64_CPU(&priv->stats.rep_stats,
196 vport_rep_loopback_stats_desc, i));
197 }
198
MLX5E_DECLARE_STATS_GRP_OP_UPDATE_STATS(vport_rep)199 static MLX5E_DECLARE_STATS_GRP_OP_UPDATE_STATS(vport_rep)
200 {
201 struct mlx5e_rep_stats *rep_stats = &priv->stats.rep_stats;
202 int outlen = MLX5_ST_SZ_BYTES(query_vport_counter_out);
203 struct mlx5_eswitch *esw = priv->mdev->priv.eswitch;
204 struct mlx5e_rep_priv *rpriv = priv->ppriv;
205 struct mlx5_eswitch_rep *rep = rpriv->rep;
206 u32 *out;
207 int err;
208
209 out = kvzalloc(outlen, GFP_KERNEL);
210 if (!out)
211 return;
212
213 err = mlx5_core_query_vport_counter(esw->dev, 1, rep->vport - 1, 0, out);
214 if (err) {
215 netdev_warn(priv->netdev, "vport %d error %d reading stats\n",
216 rep->vport, err);
217 goto out;
218 }
219
220 #define MLX5_GET_CTR(p, x) \
221 MLX5_GET64(query_vport_counter_out, p, x)
222 /* flip tx/rx as we are reporting the counters for the switch vport */
223 rep_stats->vport_rx_packets =
224 MLX5_GET_CTR(out, transmitted_ib_unicast.packets) +
225 MLX5_GET_CTR(out, transmitted_eth_unicast.packets) +
226 MLX5_GET_CTR(out, transmitted_ib_multicast.packets) +
227 MLX5_GET_CTR(out, transmitted_eth_multicast.packets) +
228 MLX5_GET_CTR(out, transmitted_eth_broadcast.packets);
229
230 rep_stats->vport_tx_packets =
231 MLX5_GET_CTR(out, received_ib_unicast.packets) +
232 MLX5_GET_CTR(out, received_eth_unicast.packets) +
233 MLX5_GET_CTR(out, received_ib_multicast.packets) +
234 MLX5_GET_CTR(out, received_eth_multicast.packets) +
235 MLX5_GET_CTR(out, received_eth_broadcast.packets);
236
237 rep_stats->vport_rx_bytes =
238 MLX5_GET_CTR(out, transmitted_ib_unicast.octets) +
239 MLX5_GET_CTR(out, transmitted_eth_unicast.octets) +
240 MLX5_GET_CTR(out, transmitted_ib_multicast.octets) +
241 MLX5_GET_CTR(out, transmitted_eth_broadcast.octets);
242
243 rep_stats->vport_tx_bytes =
244 MLX5_GET_CTR(out, received_ib_unicast.octets) +
245 MLX5_GET_CTR(out, received_eth_unicast.octets) +
246 MLX5_GET_CTR(out, received_ib_multicast.octets) +
247 MLX5_GET_CTR(out, received_eth_multicast.octets) +
248 MLX5_GET_CTR(out, received_eth_broadcast.octets);
249
250 rep_stats->rx_vport_rdma_unicast_packets =
251 MLX5_GET_CTR(out, transmitted_ib_unicast.packets);
252 rep_stats->tx_vport_rdma_unicast_packets =
253 MLX5_GET_CTR(out, received_ib_unicast.packets);
254 rep_stats->rx_vport_rdma_unicast_bytes =
255 MLX5_GET_CTR(out, transmitted_ib_unicast.octets);
256 rep_stats->tx_vport_rdma_unicast_bytes =
257 MLX5_GET_CTR(out, received_ib_unicast.octets);
258 rep_stats->rx_vport_rdma_multicast_packets =
259 MLX5_GET_CTR(out, transmitted_ib_multicast.packets);
260 rep_stats->tx_vport_rdma_multicast_packets =
261 MLX5_GET_CTR(out, received_ib_multicast.packets);
262 rep_stats->rx_vport_rdma_multicast_bytes =
263 MLX5_GET_CTR(out, transmitted_ib_multicast.octets);
264 rep_stats->tx_vport_rdma_multicast_bytes =
265 MLX5_GET_CTR(out, received_ib_multicast.octets);
266
267 if (MLX5_CAP_GEN(priv->mdev, vport_counter_local_loopback)) {
268 rep_stats->vport_loopback_packets =
269 MLX5_GET_CTR(out, local_loopback.packets);
270 rep_stats->vport_loopback_bytes =
271 MLX5_GET_CTR(out, local_loopback.octets);
272 }
273
274 out:
275 kvfree(out);
276 }
277
mlx5e_rep_query_aggr_q_counter(struct mlx5_core_dev * dev,int vport,void * out)278 static int mlx5e_rep_query_aggr_q_counter(struct mlx5_core_dev *dev, int vport, void *out)
279 {
280 u32 in[MLX5_ST_SZ_DW(query_q_counter_in)] = {};
281
282 MLX5_SET(query_q_counter_in, in, opcode, MLX5_CMD_OP_QUERY_Q_COUNTER);
283 MLX5_SET(query_q_counter_in, in, other_vport, 1);
284 MLX5_SET(query_q_counter_in, in, vport_number, vport);
285 MLX5_SET(query_q_counter_in, in, aggregate, 1);
286
287 return mlx5_cmd_exec_inout(dev, query_q_counter, in, out);
288 }
289
mlx5e_rep_update_vport_q_counter(struct mlx5e_priv * priv)290 static void mlx5e_rep_update_vport_q_counter(struct mlx5e_priv *priv)
291 {
292 struct mlx5e_rep_stats *rep_stats = &priv->stats.rep_stats;
293 u32 out[MLX5_ST_SZ_DW(query_q_counter_out)] = {};
294 struct mlx5e_rep_priv *rpriv = priv->ppriv;
295 struct mlx5_eswitch_rep *rep = rpriv->rep;
296 int err;
297
298 if (!MLX5_CAP_GEN(priv->mdev, q_counter_other_vport) ||
299 !MLX5_CAP_GEN(priv->mdev, q_counter_aggregation))
300 return;
301
302 err = mlx5e_rep_query_aggr_q_counter(priv->mdev, rep->vport, out);
303 if (err) {
304 netdev_warn(priv->netdev, "failed reading stats on vport %d, error %d\n",
305 rep->vport, err);
306 return;
307 }
308
309 rep_stats->rx_vport_out_of_buffer = MLX5_GET(query_q_counter_out, out, out_of_buffer);
310 }
311
/* ethtool get_strings callback: only the ETH_SS_STATS string set is filled;
 * any other set leaves @data untouched.
 */
static void mlx5e_rep_get_strings(struct net_device *dev,
				  u32 stringset, u8 *data)
{
	if (stringset != ETH_SS_STATS)
		return;

	mlx5e_stats_fill_strings(netdev_priv(dev), data);
}
323
/* ethtool get_ethtool_stats callback: forwards to the common mlx5e helper. */
static void mlx5e_rep_get_ethtool_stats(struct net_device *dev,
					struct ethtool_stats *stats, u64 *data)
{
	mlx5e_ethtool_get_ethtool_stats(netdev_priv(dev), stats, data);
}
331
mlx5e_rep_get_sset_count(struct net_device * dev,int sset)332 static int mlx5e_rep_get_sset_count(struct net_device *dev, int sset)
333 {
334 struct mlx5e_priv *priv = netdev_priv(dev);
335
336 switch (sset) {
337 case ETH_SS_STATS:
338 return mlx5e_stats_total_num(priv);
339 default:
340 return -EOPNOTSUPP;
341 }
342 }
343
/* ethtool get_ringparam callback: forwards to the common mlx5e helper;
 * @extack is not used.
 */
static void
mlx5e_rep_get_ringparam(struct net_device *dev,
			struct ethtool_ringparam *param,
			struct kernel_ethtool_ringparam *kernel_param,
			struct netlink_ext_ack *extack)
{
	mlx5e_ethtool_get_ringparam(netdev_priv(dev), param, kernel_param);
}
354
/* ethtool set_ringparam callback: forwards to the common mlx5e helper and
 * returns its result; @kernel_param is not used.
 */
static int
mlx5e_rep_set_ringparam(struct net_device *dev,
			struct ethtool_ringparam *param,
			struct kernel_ethtool_ringparam *kernel_param,
			struct netlink_ext_ack *extack)
{
	return mlx5e_ethtool_set_ringparam(netdev_priv(dev), param, extack);
}
365
/* ethtool get_channels callback: forwards to the common mlx5e helper. */
static void mlx5e_rep_get_channels(struct net_device *dev,
				   struct ethtool_channels *ch)
{
	mlx5e_ethtool_get_channels(netdev_priv(dev), ch);
}
373
/* ethtool set_channels callback: forwards to the common mlx5e helper and
 * returns its result.
 */
static int mlx5e_rep_set_channels(struct net_device *dev,
				  struct ethtool_channels *ch)
{
	return mlx5e_ethtool_set_channels(netdev_priv(dev), ch);
}
381
/* ethtool get_coalesce callback: forwards to the common mlx5e helper and
 * returns its result.
 */
static int mlx5e_rep_get_coalesce(struct net_device *netdev,
				  struct ethtool_coalesce *coal,
				  struct kernel_ethtool_coalesce *kernel_coal,
				  struct netlink_ext_ack *extack)
{
	return mlx5e_ethtool_get_coalesce(netdev_priv(netdev), coal,
					  kernel_coal, extack);
}
391
/* ethtool set_coalesce callback: forwards to the common mlx5e helper and
 * returns its result.
 */
static int mlx5e_rep_set_coalesce(struct net_device *netdev,
				  struct ethtool_coalesce *coal,
				  struct kernel_ethtool_coalesce *kernel_coal,
				  struct netlink_ext_ack *extack)
{
	return mlx5e_ethtool_set_coalesce(netdev_priv(netdev), coal,
					  kernel_coal, extack);
}
401
mlx5e_rep_get_rxfh_key_size(struct net_device * netdev)402 static u32 mlx5e_rep_get_rxfh_key_size(struct net_device *netdev)
403 {
404 struct mlx5e_priv *priv = netdev_priv(netdev);
405
406 return mlx5e_ethtool_get_rxfh_key_size(priv);
407 }
408
mlx5e_rep_get_rxfh_indir_size(struct net_device * netdev)409 static u32 mlx5e_rep_get_rxfh_indir_size(struct net_device *netdev)
410 {
411 struct mlx5e_priv *priv = netdev_priv(netdev);
412
413 return mlx5e_ethtool_get_rxfh_indir_size(priv);
414 }
415
416 static const struct ethtool_ops mlx5e_rep_ethtool_ops = {
417 .supported_coalesce_params = ETHTOOL_COALESCE_USECS |
418 ETHTOOL_COALESCE_MAX_FRAMES |
419 ETHTOOL_COALESCE_USE_ADAPTIVE,
420 .get_drvinfo = mlx5e_rep_get_drvinfo,
421 .get_link = ethtool_op_get_link,
422 .get_strings = mlx5e_rep_get_strings,
423 .get_sset_count = mlx5e_rep_get_sset_count,
424 .get_ethtool_stats = mlx5e_rep_get_ethtool_stats,
425 .get_ringparam = mlx5e_rep_get_ringparam,
426 .set_ringparam = mlx5e_rep_set_ringparam,
427 .get_channels = mlx5e_rep_get_channels,
428 .set_channels = mlx5e_rep_set_channels,
429 .get_coalesce = mlx5e_rep_get_coalesce,
430 .set_coalesce = mlx5e_rep_set_coalesce,
431 .get_per_queue_coalesce = mlx5e_get_per_queue_coalesce,
432 .set_per_queue_coalesce = mlx5e_set_per_queue_coalesce,
433 .get_rxfh_key_size = mlx5e_rep_get_rxfh_key_size,
434 .get_rxfh_indir_size = mlx5e_rep_get_rxfh_indir_size,
435 };
436
mlx5e_sqs2vport_stop(struct mlx5_eswitch * esw,struct mlx5_eswitch_rep * rep)437 static void mlx5e_sqs2vport_stop(struct mlx5_eswitch *esw,
438 struct mlx5_eswitch_rep *rep)
439 {
440 struct mlx5e_rep_sq *rep_sq, *tmp;
441 struct mlx5e_rep_sq_peer *sq_peer;
442 struct mlx5e_rep_priv *rpriv;
443 unsigned long i;
444
445 if (esw->mode != MLX5_ESWITCH_OFFLOADS)
446 return;
447
448 rpriv = mlx5e_rep_to_rep_priv(rep);
449 list_for_each_entry_safe(rep_sq, tmp, &rpriv->vport_sqs_list, list) {
450 mlx5_eswitch_del_send_to_vport_rule(rep_sq->send_to_vport_rule);
451 xa_for_each(&rep_sq->sq_peer, i, sq_peer) {
452 if (sq_peer->rule)
453 mlx5_eswitch_del_send_to_vport_rule(sq_peer->rule);
454
455 xa_erase(&rep_sq->sq_peer, i);
456 kfree(sq_peer);
457 }
458
459 xa_destroy(&rep_sq->sq_peer);
460 list_del(&rep_sq->list);
461 kfree(rep_sq);
462 }
463 }
464
mlx5e_sqs2vport_add_peers_rules(struct mlx5_eswitch * esw,struct mlx5_eswitch_rep * rep,struct mlx5e_rep_sq * rep_sq,int i)465 static int mlx5e_sqs2vport_add_peers_rules(struct mlx5_eswitch *esw, struct mlx5_eswitch_rep *rep,
466 struct mlx5e_rep_sq *rep_sq, int i)
467 {
468 struct mlx5_flow_handle *flow_rule;
469 struct mlx5_devcom_comp_dev *tmp;
470 struct mlx5_eswitch *peer_esw;
471
472 mlx5_devcom_for_each_peer_entry(esw->devcom, peer_esw, tmp) {
473 u16 peer_rule_idx = MLX5_CAP_GEN(peer_esw->dev, vhca_id);
474 struct mlx5e_rep_sq_peer *sq_peer;
475 int err;
476
477 sq_peer = kzalloc(sizeof(*sq_peer), GFP_KERNEL);
478 if (!sq_peer)
479 return -ENOMEM;
480
481 flow_rule = mlx5_eswitch_add_send_to_vport_rule(peer_esw, esw,
482 rep, rep_sq->sqn);
483 if (IS_ERR(flow_rule)) {
484 kfree(sq_peer);
485 return PTR_ERR(flow_rule);
486 }
487
488 sq_peer->rule = flow_rule;
489 sq_peer->peer = peer_esw;
490 err = xa_insert(&rep_sq->sq_peer, peer_rule_idx, sq_peer, GFP_KERNEL);
491 if (err) {
492 kfree(sq_peer);
493 mlx5_eswitch_del_send_to_vport_rule(flow_rule);
494 return err;
495 }
496 }
497
498 return 0;
499 }
500
/*
 * Install a send-to-vport (re-inject) rule for each SQ number in @sqns_array
 * and, when the devcom component is ready and its peer iteration could be
 * started, the matching rules on every peer eswitch.
 *
 * @esw:        eswitch owning the representor
 * @rep:        representor whose SQs are being attached
 * @sqns_array: SQ numbers to attach
 * @sqns_num:   number of entries in @sqns_array
 *
 * Returns 0 on success (also when the eswitch is not in offloads mode, in
 * which case nothing is done) or a negative errno. On failure everything
 * added so far is torn down again.
 */
static int mlx5e_sqs2vport_start(struct mlx5_eswitch *esw,
				 struct mlx5_eswitch_rep *rep,
				 u32 *sqns_array, int sqns_num)
{
	struct mlx5_flow_handle *flow_rule;
	struct mlx5e_rep_sq_peer *sq_peer;
	struct mlx5e_rep_priv *rpriv;
	struct mlx5e_rep_sq *rep_sq;
	bool devcom_locked = false;
	unsigned long peer_idx;
	int err;
	int i;

	if (esw->mode != MLX5_ESWITCH_OFFLOADS)
		return 0;

	rpriv = mlx5e_rep_to_rep_priv(rep);

	if (mlx5_devcom_comp_is_ready(esw->devcom) &&
	    mlx5_devcom_for_each_peer_begin(esw->devcom))
		devcom_locked = true;

	for (i = 0; i < sqns_num; i++) {
		rep_sq = kzalloc(sizeof(*rep_sq), GFP_KERNEL);
		if (!rep_sq) {
			err = -ENOMEM;
			goto out_err;
		}

		/* Add re-inject rule to the PF/representor sqs */
		flow_rule = mlx5_eswitch_add_send_to_vport_rule(esw, esw, rep,
								sqns_array[i]);
		if (IS_ERR(flow_rule)) {
			err = PTR_ERR(flow_rule);
			kfree(rep_sq);
			goto out_err;
		}
		rep_sq->send_to_vport_rule = flow_rule;
		rep_sq->sqn = sqns_array[i];

		xa_init(&rep_sq->sq_peer);
		if (devcom_locked) {
			err = mlx5e_sqs2vport_add_peers_rules(esw, rep, rep_sq, i);
			if (err) {
				mlx5_eswitch_del_send_to_vport_rule(rep_sq->send_to_vport_rule);
				/* rep_sq is not on vport_sqs_list yet, so
				 * mlx5e_sqs2vport_stop() cannot reach the peer
				 * entries that were inserted before the
				 * failure; release them here, otherwise they
				 * and their rules would leak.
				 */
				xa_for_each(&rep_sq->sq_peer, peer_idx, sq_peer) {
					if (sq_peer->rule)
						mlx5_eswitch_del_send_to_vport_rule(sq_peer->rule);

					xa_erase(&rep_sq->sq_peer, peer_idx);
					kfree(sq_peer);
				}
				xa_destroy(&rep_sq->sq_peer);
				kfree(rep_sq);
				goto out_err;
			}
		}

		list_add(&rep_sq->list, &rpriv->vport_sqs_list);
	}

	if (devcom_locked)
		mlx5_devcom_for_each_peer_end(esw->devcom);

	return 0;

out_err:
	/* Undo the SQs that were fully added before the failure. */
	mlx5e_sqs2vport_stop(esw, rep);

	if (devcom_locked)
		mlx5_devcom_for_each_peer_end(esw->devcom);

	return err;
}
566
567 static int
mlx5e_add_sqs_fwd_rules(struct mlx5e_priv * priv)568 mlx5e_add_sqs_fwd_rules(struct mlx5e_priv *priv)
569 {
570 int sqs_per_channel = mlx5e_get_dcb_num_tc(&priv->channels.params);
571 struct mlx5_eswitch *esw = priv->mdev->priv.eswitch;
572 bool is_uplink_rep = mlx5e_is_uplink_rep(priv);
573 struct mlx5e_rep_priv *rpriv = priv->ppriv;
574 struct mlx5_eswitch_rep *rep = rpriv->rep;
575 int n, tc, nch, num_sqs = 0;
576 struct mlx5e_channel *c;
577 int err = -ENOMEM;
578 bool ptp_sq;
579 u32 *sqs;
580
581 ptp_sq = !!(priv->channels.ptp &&
582 MLX5E_GET_PFLAG(&priv->channels.params, MLX5E_PFLAG_TX_PORT_TS));
583 nch = priv->channels.num + ptp_sq;
584 /* +2 for xdpsqs, they don't exist on the ptp channel but will not be
585 * counted for by num_sqs.
586 */
587 if (is_uplink_rep)
588 sqs_per_channel += 2;
589
590 sqs = kvcalloc(nch * sqs_per_channel, sizeof(*sqs), GFP_KERNEL);
591 if (!sqs)
592 goto out;
593
594 for (n = 0; n < priv->channels.num; n++) {
595 c = priv->channels.c[n];
596 for (tc = 0; tc < c->num_tc; tc++)
597 sqs[num_sqs++] = c->sq[tc].sqn;
598
599 if (is_uplink_rep) {
600 if (c->xdp)
601 sqs[num_sqs++] = c->rq_xdpsq.sqn;
602
603 if (c->xdpsq)
604 sqs[num_sqs++] = c->xdpsq->sqn;
605 }
606 }
607 if (ptp_sq) {
608 struct mlx5e_ptp *ptp_ch = priv->channels.ptp;
609
610 for (tc = 0; tc < ptp_ch->num_tc; tc++)
611 sqs[num_sqs++] = ptp_ch->ptpsq[tc].txqsq.sqn;
612 }
613
614 err = mlx5e_sqs2vport_start(esw, rep, sqs, num_sqs);
615 kvfree(sqs);
616
617 out:
618 if (err)
619 netdev_warn(priv->netdev, "Failed to add SQs FWD rules %d\n", err);
620 return err;
621 }
622
623 static void
mlx5e_remove_sqs_fwd_rules(struct mlx5e_priv * priv)624 mlx5e_remove_sqs_fwd_rules(struct mlx5e_priv *priv)
625 {
626 struct mlx5_eswitch *esw = priv->mdev->priv.eswitch;
627 struct mlx5e_rep_priv *rpriv = priv->ppriv;
628 struct mlx5_eswitch_rep *rep = rpriv->rep;
629
630 mlx5e_sqs2vport_stop(esw, rep);
631 }
632
633 static int
mlx5e_rep_add_meta_tunnel_rule(struct mlx5e_priv * priv)634 mlx5e_rep_add_meta_tunnel_rule(struct mlx5e_priv *priv)
635 {
636 struct mlx5_eswitch *esw = priv->mdev->priv.eswitch;
637 struct mlx5e_rep_priv *rpriv = priv->ppriv;
638 struct mlx5_eswitch_rep *rep = rpriv->rep;
639 struct mlx5_flow_handle *flow_rule;
640 struct mlx5_flow_group *g;
641
642 g = esw->fdb_table.offloads.send_to_vport_meta_grp;
643 if (!g)
644 return 0;
645
646 flow_rule = mlx5_eswitch_add_send_to_vport_meta_rule(esw, rep->vport);
647 if (IS_ERR(flow_rule))
648 return PTR_ERR(flow_rule);
649
650 rpriv->send_to_vport_meta_rule = flow_rule;
651
652 return 0;
653 }
654
655 static void
mlx5e_rep_del_meta_tunnel_rule(struct mlx5e_priv * priv)656 mlx5e_rep_del_meta_tunnel_rule(struct mlx5e_priv *priv)
657 {
658 struct mlx5e_rep_priv *rpriv = priv->ppriv;
659
660 if (rpriv->send_to_vport_meta_rule)
661 mlx5_eswitch_del_send_to_vport_meta_rule(rpriv->send_to_vport_meta_rule);
662 }
663
/*
 * Install the representor's steering rules: first the per-SQ forwarding
 * rules, then the meta tunnel rule.
 *
 * Both steps are best effort; their return values are not propagated.
 */
void mlx5e_rep_activate_channels(struct mlx5e_priv *priv)
{
	/* Logs a warning by itself on failure. */
	mlx5e_add_sqs_fwd_rules(priv);

	mlx5e_rep_add_meta_tunnel_rule(priv);
}
669
/*
 * Remove the representor's steering rules in the reverse order of
 * mlx5e_rep_activate_channels(): the meta tunnel rule first, then the per-SQ
 * forwarding rules.
 */
void mlx5e_rep_deactivate_channels(struct mlx5e_priv *priv)
{
	mlx5e_rep_del_meta_tunnel_rule(priv);

	mlx5e_remove_sqs_fwd_rules(priv);
}
675
mlx5e_rep_open(struct net_device * dev)676 static int mlx5e_rep_open(struct net_device *dev)
677 {
678 struct mlx5e_priv *priv = netdev_priv(dev);
679 struct mlx5e_rep_priv *rpriv = priv->ppriv;
680 struct mlx5_eswitch_rep *rep = rpriv->rep;
681 int err;
682
683 mutex_lock(&priv->state_lock);
684 err = mlx5e_open_locked(dev);
685 if (err)
686 goto unlock;
687
688 if (!mlx5_modify_vport_admin_state(priv->mdev,
689 MLX5_VPORT_STATE_OP_MOD_ESW_VPORT,
690 rep->vport, 1,
691 MLX5_VPORT_ADMIN_STATE_UP))
692 netif_carrier_on(dev);
693
694 unlock:
695 mutex_unlock(&priv->state_lock);
696 return err;
697 }
698
mlx5e_rep_close(struct net_device * dev)699 static int mlx5e_rep_close(struct net_device *dev)
700 {
701 struct mlx5e_priv *priv = netdev_priv(dev);
702 struct mlx5e_rep_priv *rpriv = priv->ppriv;
703 struct mlx5_eswitch_rep *rep = rpriv->rep;
704 int ret;
705
706 mutex_lock(&priv->state_lock);
707 mlx5_modify_vport_admin_state(priv->mdev,
708 MLX5_VPORT_STATE_OP_MOD_ESW_VPORT,
709 rep->vport, 1,
710 MLX5_VPORT_ADMIN_STATE_DOWN);
711 ret = mlx5e_close_locked(dev);
712 mutex_unlock(&priv->state_lock);
713 return ret;
714 }
715
mlx5e_is_uplink_rep(struct mlx5e_priv * priv)716 bool mlx5e_is_uplink_rep(struct mlx5e_priv *priv)
717 {
718 struct mlx5e_rep_priv *rpriv = priv->ppriv;
719 struct mlx5_eswitch_rep *rep;
720
721 if (!MLX5_ESWITCH_MANAGER(priv->mdev))
722 return false;
723
724 if (!rpriv) /* non vport rep mlx5e instances don't use this field */
725 return false;
726
727 rep = rpriv->rep;
728 return (rep->vport == MLX5_VPORT_UPLINK);
729 }
730
mlx5e_rep_has_offload_stats(const struct net_device * dev,int attr_id)731 bool mlx5e_rep_has_offload_stats(const struct net_device *dev, int attr_id)
732 {
733 switch (attr_id) {
734 case IFLA_OFFLOAD_XSTATS_CPU_HIT:
735 return true;
736 }
737
738 return false;
739 }
740
/* Fill @stats with the folded software counters of @dev. Always returns 0. */
static int
mlx5e_get_sw_stats64(const struct net_device *dev,
		     struct rtnl_link_stats64 *stats)
{
	mlx5e_fold_sw_stats64(netdev_priv(dev), stats);

	return 0;
}
750
mlx5e_rep_get_offload_stats(int attr_id,const struct net_device * dev,void * sp)751 int mlx5e_rep_get_offload_stats(int attr_id, const struct net_device *dev,
752 void *sp)
753 {
754 switch (attr_id) {
755 case IFLA_OFFLOAD_XSTATS_CPU_HIT:
756 return mlx5e_get_sw_stats64(dev, sp);
757 }
758
759 return -EINVAL;
760 }
761
762 static void
mlx5e_rep_get_stats(struct net_device * dev,struct rtnl_link_stats64 * stats)763 mlx5e_rep_get_stats(struct net_device *dev, struct rtnl_link_stats64 *stats)
764 {
765 struct mlx5e_priv *priv = netdev_priv(dev);
766
767 /* update HW stats in background for next time */
768 mlx5e_queue_update_stats(priv);
769 mlx5e_stats_copy_rep_stats(stats, &priv->stats.rep_stats);
770 }
771
mlx5e_rep_change_mtu(struct net_device * netdev,int new_mtu)772 static int mlx5e_rep_change_mtu(struct net_device *netdev, int new_mtu)
773 {
774 return mlx5e_change_mtu(netdev, new_mtu, NULL);
775 }
776
/*
 * ndo_change_carrier for representors.
 *
 * Sets the vport's admin state to up or down according to @new_carrier and,
 * only if that succeeds, updates the netdev carrier to match.
 *
 * Returns 0 on success or the error from mlx5_modify_vport_admin_state().
 */
static int mlx5e_rep_change_carrier(struct net_device *dev, bool new_carrier)
{
	struct mlx5e_priv *priv = netdev_priv(dev);
	struct mlx5e_rep_priv *rpriv = priv->ppriv;
	struct mlx5_eswitch_rep *rep = rpriv->rep;
	int admin_state;
	int err;

	admin_state = new_carrier ? MLX5_VPORT_ADMIN_STATE_UP :
				    MLX5_VPORT_ADMIN_STATE_DOWN;

	err = mlx5_modify_vport_admin_state(priv->mdev, MLX5_VPORT_STATE_OP_MOD_ESW_VPORT,
					    rep->vport, 1, admin_state);
	if (err)
		return err;

	if (new_carrier)
		netif_carrier_on(dev);
	else
		netif_carrier_off(dev);

	return 0;
}
799
800 static const struct net_device_ops mlx5e_netdev_ops_rep = {
801 .ndo_open = mlx5e_rep_open,
802 .ndo_stop = mlx5e_rep_close,
803 .ndo_start_xmit = mlx5e_xmit,
804 .ndo_setup_tc = mlx5e_rep_setup_tc,
805 .ndo_get_stats64 = mlx5e_rep_get_stats,
806 .ndo_has_offload_stats = mlx5e_rep_has_offload_stats,
807 .ndo_get_offload_stats = mlx5e_rep_get_offload_stats,
808 .ndo_change_mtu = mlx5e_rep_change_mtu,
809 .ndo_change_carrier = mlx5e_rep_change_carrier,
810 };
811
mlx5e_eswitch_uplink_rep(const struct net_device * netdev)812 bool mlx5e_eswitch_uplink_rep(const struct net_device *netdev)
813 {
814 return netdev->netdev_ops == &mlx5e_netdev_ops &&
815 mlx5e_is_uplink_rep(netdev_priv(netdev));
816 }
817
mlx5e_eswitch_vf_rep(const struct net_device * netdev)818 bool mlx5e_eswitch_vf_rep(const struct net_device *netdev)
819 {
820 return netdev->netdev_ops == &mlx5e_netdev_ops_rep;
821 }
822
/* One indirect TIR set for outer. Inner is not supported in reps.
 * Used by mlx5e_rep_max_nch_limit() as the per-vport indirect TIR count.
 */
#define REP_NUM_INDIR_TIRS MLX5E_NUM_INDIR_TIRS
825
mlx5e_rep_max_nch_limit(struct mlx5_core_dev * mdev)826 static int mlx5e_rep_max_nch_limit(struct mlx5_core_dev *mdev)
827 {
828 int max_tir_num = 1 << MLX5_CAP_GEN(mdev, log_max_tir);
829 int num_vports = mlx5_eswitch_get_total_vports(mdev);
830
831 return (max_tir_num - mlx5e_get_pf_num_tirs(mdev)
832 - (num_vports * REP_NUM_INDIR_TIRS)) / num_vports;
833 }
834
mlx5e_build_rep_params(struct net_device * netdev)835 static void mlx5e_build_rep_params(struct net_device *netdev)
836 {
837 const bool take_rtnl = netdev->reg_state == NETREG_REGISTERED;
838 struct mlx5e_priv *priv = netdev_priv(netdev);
839 struct mlx5e_rep_priv *rpriv = priv->ppriv;
840 struct mlx5_eswitch_rep *rep = rpriv->rep;
841 struct mlx5_core_dev *mdev = priv->mdev;
842 struct mlx5e_params *params;
843
844 params = &priv->channels.params;
845
846 params->num_channels = MLX5E_REP_PARAMS_DEF_NUM_CHANNELS;
847 params->hard_mtu = MLX5E_ETH_HARD_MTU;
848 params->sw_mtu = netdev->mtu;
849
850 /* SQ */
851 if (rep->vport == MLX5_VPORT_UPLINK)
852 params->log_sq_size = MLX5E_PARAMS_DEFAULT_LOG_SQ_SIZE;
853 else
854 params->log_sq_size = MLX5E_REP_PARAMS_DEF_LOG_SQ_SIZE;
855
856 /* RQ */
857 mlx5e_build_rq_params(mdev, params);
858
859 /* If netdev is already registered (e.g. move from nic profile to uplink,
860 * RTNL lock must be held before triggering netdev notifiers.
861 */
862 if (take_rtnl)
863 rtnl_lock();
864 /* update XDP supported features */
865 mlx5e_set_xdp_feature(netdev);
866 if (take_rtnl)
867 rtnl_unlock();
868
869 /* CQ moderation params */
870 params->rx_dim_enabled = MLX5_CAP_GEN(mdev, cq_moderation);
871 params->rx_moder_use_cqe_mode = !!MLX5_CAP_GEN(mdev, cq_period_start_from_cqe);
872
873 params->mqprio.num_tc = 1;
874 if (rep->vport != MLX5_VPORT_UPLINK)
875 params->vlan_strip_disable = true;
876
877 mlx5_query_min_inline(mdev, ¶ms->tx_min_inline_mode);
878 }
879
mlx5e_build_rep_netdev(struct net_device * netdev,struct mlx5_core_dev * mdev)880 static void mlx5e_build_rep_netdev(struct net_device *netdev,
881 struct mlx5_core_dev *mdev)
882 {
883 SET_NETDEV_DEV(netdev, mdev->device);
884 netdev->netdev_ops = &mlx5e_netdev_ops_rep;
885 eth_hw_addr_random(netdev);
886 netdev->ethtool_ops = &mlx5e_rep_ethtool_ops;
887
888 netdev->watchdog_timeo = 15 * HZ;
889
890 #if IS_ENABLED(CONFIG_MLX5_CLS_ACT)
891 netdev->hw_features |= NETIF_F_HW_TC;
892 #endif
893 netdev->hw_features |= NETIF_F_SG;
894 netdev->hw_features |= NETIF_F_IP_CSUM;
895 netdev->hw_features |= NETIF_F_IPV6_CSUM;
896 netdev->hw_features |= NETIF_F_GRO;
897 netdev->hw_features |= NETIF_F_TSO;
898 netdev->hw_features |= NETIF_F_TSO6;
899 netdev->hw_features |= NETIF_F_RXCSUM;
900
901 netdev->features |= netdev->hw_features;
902
903 netdev->netns_local = true;
904 }
905
mlx5e_init_rep(struct mlx5_core_dev * mdev,struct net_device * netdev)906 static int mlx5e_init_rep(struct mlx5_core_dev *mdev,
907 struct net_device *netdev)
908 {
909 struct mlx5e_priv *priv = netdev_priv(netdev);
910
911 priv->fs =
912 mlx5e_fs_init(priv->profile, mdev,
913 !test_bit(MLX5E_STATE_DESTROYING, &priv->state),
914 priv->dfs_root);
915 if (!priv->fs) {
916 netdev_err(priv->netdev, "FS allocation failed\n");
917 return -ENOMEM;
918 }
919
920 mlx5e_build_rep_params(netdev);
921 mlx5e_timestamp_init(priv);
922
923 return 0;
924 }
925
mlx5e_init_ul_rep(struct mlx5_core_dev * mdev,struct net_device * netdev)926 static int mlx5e_init_ul_rep(struct mlx5_core_dev *mdev,
927 struct net_device *netdev)
928 {
929 struct mlx5e_priv *priv = netdev_priv(netdev);
930
931 priv->dfs_root = debugfs_create_dir("nic",
932 mlx5_debugfs_get_dev_root(mdev));
933
934 priv->fs = mlx5e_fs_init(priv->profile, mdev,
935 !test_bit(MLX5E_STATE_DESTROYING, &priv->state),
936 priv->dfs_root);
937 if (!priv->fs) {
938 netdev_err(priv->netdev, "FS allocation failed\n");
939 debugfs_remove_recursive(priv->dfs_root);
940 return -ENOMEM;
941 }
942
943 mlx5e_vxlan_set_netdev_info(priv);
944 mlx5e_build_rep_params(netdev);
945 mlx5e_timestamp_init(priv);
946 return 0;
947 }
948
/* Profile ->cleanup() callback shared by both representor profiles.
 *
 * Releases the flow steering context held in priv->fs and removes the
 * debugfs directory referenced by priv->dfs_root.
 */
static void mlx5e_cleanup_rep(struct mlx5e_priv *priv)
{
	mlx5e_fs_cleanup(priv->fs);
	debugfs_remove_recursive(priv->dfs_root);
	/* Drop the stale pointer so priv->fs no longer refers to the released context */
	priv->fs = NULL;
}
955
mlx5e_create_rep_ttc_table(struct mlx5e_priv * priv)956 static int mlx5e_create_rep_ttc_table(struct mlx5e_priv *priv)
957 {
958 struct mlx5e_rep_priv *rpriv = priv->ppriv;
959 struct mlx5_eswitch_rep *rep = rpriv->rep;
960 struct ttc_params ttc_params = {};
961 int err;
962
963 mlx5e_fs_set_ns(priv->fs,
964 mlx5_get_flow_namespace(priv->mdev,
965 MLX5_FLOW_NAMESPACE_KERNEL), false);
966
967 /* The inner_ttc in the ttc params is intentionally not set */
968 mlx5e_set_ttc_params(priv->fs, priv->rx_res, &ttc_params, false);
969
970 if (rep->vport != MLX5_VPORT_UPLINK)
971 /* To give uplik rep TTC a lower level for chaining from root ft */
972 ttc_params.ft_attr.level = MLX5E_TTC_FT_LEVEL + 1;
973
974 mlx5e_fs_set_ttc(priv->fs, mlx5_create_ttc_table(priv->mdev, &ttc_params), false);
975 if (IS_ERR(mlx5e_fs_get_ttc(priv->fs, false))) {
976 err = PTR_ERR(mlx5e_fs_get_ttc(priv->fs, false));
977 netdev_err(priv->netdev, "Failed to create rep ttc table, err=%d\n",
978 err);
979 return err;
980 }
981 return 0;
982 }
983
mlx5e_create_rep_root_ft(struct mlx5e_priv * priv)984 static int mlx5e_create_rep_root_ft(struct mlx5e_priv *priv)
985 {
986 struct mlx5e_rep_priv *rpriv = priv->ppriv;
987 struct mlx5_eswitch_rep *rep = rpriv->rep;
988 struct mlx5_flow_table_attr ft_attr = {};
989 struct mlx5_flow_namespace *ns;
990 int err = 0;
991
992 if (rep->vport != MLX5_VPORT_UPLINK) {
993 /* non uplik reps will skip any bypass tables and go directly to
994 * their own ttc
995 */
996 rpriv->root_ft = mlx5_get_ttc_flow_table(mlx5e_fs_get_ttc(priv->fs, false));
997 return 0;
998 }
999
1000 /* uplink root ft will be used to auto chain, to ethtool or ttc tables */
1001 ns = mlx5_get_flow_namespace(priv->mdev, MLX5_FLOW_NAMESPACE_OFFLOADS);
1002 if (!ns) {
1003 netdev_err(priv->netdev, "Failed to get reps offloads namespace\n");
1004 return -EOPNOTSUPP;
1005 }
1006
1007 ft_attr.max_fte = 0; /* Empty table, miss rule will always point to next table */
1008 ft_attr.prio = 1;
1009 ft_attr.level = 1;
1010
1011 rpriv->root_ft = mlx5_create_flow_table(ns, &ft_attr);
1012 if (IS_ERR(rpriv->root_ft)) {
1013 err = PTR_ERR(rpriv->root_ft);
1014 rpriv->root_ft = NULL;
1015 }
1016
1017 return err;
1018 }
1019
mlx5e_destroy_rep_root_ft(struct mlx5e_priv * priv)1020 static void mlx5e_destroy_rep_root_ft(struct mlx5e_priv *priv)
1021 {
1022 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1023 struct mlx5_eswitch_rep *rep = rpriv->rep;
1024
1025 if (rep->vport != MLX5_VPORT_UPLINK)
1026 return;
1027 mlx5_destroy_flow_table(rpriv->root_ft);
1028 }
1029
mlx5e_create_rep_vport_rx_rule(struct mlx5e_priv * priv)1030 static int mlx5e_create_rep_vport_rx_rule(struct mlx5e_priv *priv)
1031 {
1032 struct mlx5_eswitch *esw = priv->mdev->priv.eswitch;
1033 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1034 struct mlx5_eswitch_rep *rep = rpriv->rep;
1035 struct mlx5_flow_handle *flow_rule;
1036 struct mlx5_flow_destination dest;
1037
1038 dest.type = MLX5_FLOW_DESTINATION_TYPE_FLOW_TABLE;
1039 dest.ft = rpriv->root_ft;
1040
1041 flow_rule = mlx5_eswitch_create_vport_rx_rule(esw, rep->vport, &dest);
1042 if (IS_ERR(flow_rule))
1043 return PTR_ERR(flow_rule);
1044 rpriv->vport_rx_rule = flow_rule;
1045 return 0;
1046 }
1047
rep_vport_rx_rule_destroy(struct mlx5e_priv * priv)1048 static void rep_vport_rx_rule_destroy(struct mlx5e_priv *priv)
1049 {
1050 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1051
1052 if (!rpriv->vport_rx_rule)
1053 return;
1054
1055 mlx5_del_flow_rules(rpriv->vport_rx_rule);
1056 rpriv->vport_rx_rule = NULL;
1057 }
1058
/* Drop the current vport RX rule and, unless @cleanup is set, install a
 * fresh one.
 *
 * Returns 0 when only cleaning up, otherwise the result of
 * mlx5e_create_rep_vport_rx_rule().
 */
int mlx5e_rep_bond_update(struct mlx5e_priv *priv, bool cleanup)
{
	rep_vport_rx_rule_destroy(priv);

	if (cleanup)
		return 0;

	return mlx5e_create_rep_vport_rx_rule(priv);
}
1065
/* Profile ->init_rx() callback of mlx5e_rep_profile; also called by
 * mlx5e_init_ul_rep_rx() for the uplink representor.
 *
 * Creates, in order: the drop RQ, the RX resources, the TTC table, the
 * root flow table and the vport RX rule, then calls
 * mlx5e_ethtool_init_steering().
 *
 * On failure everything created so far is released in reverse order, and
 * priv->fs is cleaned up and cleared as well.
 *
 * Returns 0 on success or a negative errno.
 */
static int mlx5e_init_rep_rx(struct mlx5e_priv *priv)
{
	struct mlx5_core_dev *mdev = priv->mdev;
	int err;

	mlx5e_fs_init_l2_addr(priv->fs, priv->netdev);

	err = mlx5e_open_drop_rq(priv, &priv->drop_rq);
	if (err) {
		mlx5_core_err(mdev, "open drop rq failed, %d\n", err);
		goto err_free_fs;
	}

	priv->rx_res = mlx5e_rx_res_create(priv->mdev, 0, priv->max_nch, priv->drop_rq.rqn,
					   &priv->channels.params.packet_merge,
					   priv->channels.params.num_channels);
	if (IS_ERR(priv->rx_res)) {
		err = PTR_ERR(priv->rx_res);
		mlx5_core_err(mdev, "Create rx resources failed, err=%d\n", err);
		goto err_close_drop_rq;
	}

	err = mlx5e_create_rep_ttc_table(priv);
	if (err)
		goto err_destroy_rx_res;

	err = mlx5e_create_rep_root_ft(priv);
	if (err)
		goto err_destroy_ttc_table;

	err = mlx5e_create_rep_vport_rx_rule(priv);
	if (err)
		goto err_destroy_root_ft;

	mlx5e_ethtool_init_steering(priv->fs);

	return 0;

err_destroy_root_ft:
	mlx5e_destroy_rep_root_ft(priv);
err_destroy_ttc_table:
	mlx5_destroy_ttc_table(mlx5e_fs_get_ttc(priv->fs, false));
err_destroy_rx_res:
	mlx5e_rx_res_destroy(priv->rx_res);
	/* Leave an error pointer (not NULL) behind, matching the IS_ERR() test above */
	priv->rx_res = ERR_PTR(-EINVAL);
err_close_drop_rq:
	mlx5e_close_drop_rq(&priv->drop_rq);
err_free_fs:
	/* NOTE(review): priv->fs is allocated by the ->init() callbacks, not
	 * here, yet it is released on this error path - confirm the later
	 * ->cleanup() call tolerates priv->fs == NULL.
	 */
	mlx5e_fs_cleanup(priv->fs);
	priv->fs = NULL;
	return err;
}
1118
/* Profile ->cleanup_rx() callback of mlx5e_rep_profile; also called by
 * mlx5e_cleanup_ul_rep_rx().
 *
 * Releases what mlx5e_init_rep_rx() created, in reverse creation order.
 * Unlike the init error path it does not touch priv->fs.
 */
static void mlx5e_cleanup_rep_rx(struct mlx5e_priv *priv)
{
	mlx5e_ethtool_cleanup_steering(priv->fs);
	rep_vport_rx_rule_destroy(priv);
	mlx5e_destroy_rep_root_ft(priv);
	mlx5_destroy_ttc_table(mlx5e_fs_get_ttc(priv->fs, false));
	mlx5e_rx_res_destroy(priv->rx_res);
	/* Leave an error pointer (not NULL) behind once the resources are gone */
	priv->rx_res = ERR_PTR(-EINVAL);
	mlx5e_close_drop_rq(&priv->drop_rq);
}
1129
mlx5e_rep_mpesw_work(struct work_struct * work)1130 static void mlx5e_rep_mpesw_work(struct work_struct *work)
1131 {
1132 struct mlx5_rep_uplink_priv *uplink_priv =
1133 container_of(work, struct mlx5_rep_uplink_priv,
1134 mpesw_work);
1135 struct mlx5e_rep_priv *rpriv =
1136 container_of(uplink_priv, struct mlx5e_rep_priv,
1137 uplink_priv);
1138 struct mlx5e_priv *priv = netdev_priv(rpriv->netdev);
1139
1140 rep_vport_rx_rule_destroy(priv);
1141 mlx5e_create_rep_vport_rx_rule(priv);
1142 }
1143
mlx5e_init_ul_rep_rx(struct mlx5e_priv * priv)1144 static int mlx5e_init_ul_rep_rx(struct mlx5e_priv *priv)
1145 {
1146 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1147 int err;
1148
1149 mlx5e_create_q_counters(priv);
1150 err = mlx5e_init_rep_rx(priv);
1151 if (err)
1152 goto out;
1153
1154 mlx5e_tc_int_port_init_rep_rx(priv);
1155
1156 INIT_WORK(&rpriv->uplink_priv.mpesw_work, mlx5e_rep_mpesw_work);
1157
1158 out:
1159 return err;
1160 }
1161
/* Profile ->cleanup_rx() callback of mlx5e_uplink_rep_profile; undoes
 * mlx5e_init_ul_rep_rx() in reverse order.
 */
static void mlx5e_cleanup_ul_rep_rx(struct mlx5e_priv *priv)
{
	struct mlx5e_rep_priv *rpriv = priv->ppriv;

	/* The work re-creates the vport RX rule, so make sure it is not
	 * pending or running before the RX state is torn down.
	 */
	cancel_work_sync(&rpriv->uplink_priv.mpesw_work);
	mlx5e_tc_int_port_cleanup_rep_rx(priv);
	mlx5e_cleanup_rep_rx(priv);
	mlx5e_destroy_q_counters(priv);
}
1171
mlx5e_init_uplink_rep_tx(struct mlx5e_rep_priv * rpriv)1172 static int mlx5e_init_uplink_rep_tx(struct mlx5e_rep_priv *rpriv)
1173 {
1174 struct mlx5_rep_uplink_priv *uplink_priv;
1175 struct net_device *netdev;
1176 struct mlx5e_priv *priv;
1177 int err;
1178
1179 netdev = rpriv->netdev;
1180 priv = netdev_priv(netdev);
1181 uplink_priv = &rpriv->uplink_priv;
1182
1183 err = mlx5e_rep_tc_init(rpriv);
1184 if (err)
1185 return err;
1186
1187 mlx5_init_port_tun_entropy(&uplink_priv->tun_entropy, priv->mdev);
1188
1189 mlx5e_rep_bond_init(rpriv);
1190 err = mlx5e_rep_tc_netdevice_event_register(rpriv);
1191 if (err) {
1192 mlx5_core_err(priv->mdev, "Failed to register netdev notifier, err: %d\n",
1193 err);
1194 goto err_event_reg;
1195 }
1196
1197 return 0;
1198
1199 err_event_reg:
1200 mlx5e_rep_bond_cleanup(rpriv);
1201 mlx5e_rep_tc_cleanup(rpriv);
1202 return err;
1203 }
1204
/* Undo mlx5e_init_uplink_rep_tx(): unregister the netdevice event notifier,
 * then clean up the bond and TC state (reverse of the init order).
 */
static void mlx5e_cleanup_uplink_rep_tx(struct mlx5e_rep_priv *rpriv)
{
	mlx5e_rep_tc_netdevice_event_unregister(rpriv);
	mlx5e_rep_bond_cleanup(rpriv);
	mlx5e_rep_tc_cleanup(rpriv);
}
1211
mlx5e_init_rep_tx(struct mlx5e_priv * priv)1212 static int mlx5e_init_rep_tx(struct mlx5e_priv *priv)
1213 {
1214 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1215 int err;
1216
1217 err = mlx5e_rep_neigh_init(rpriv);
1218 if (err)
1219 goto err_neigh_init;
1220
1221 if (rpriv->rep->vport == MLX5_VPORT_UPLINK) {
1222 err = mlx5e_init_uplink_rep_tx(rpriv);
1223 if (err)
1224 goto err_init_tx;
1225 }
1226
1227 err = mlx5e_tc_ht_init(&rpriv->tc_ht);
1228 if (err)
1229 goto err_ht_init;
1230
1231 return 0;
1232
1233 err_ht_init:
1234 if (rpriv->rep->vport == MLX5_VPORT_UPLINK)
1235 mlx5e_cleanup_uplink_rep_tx(rpriv);
1236 err_init_tx:
1237 mlx5e_rep_neigh_cleanup(rpriv);
1238 err_neigh_init:
1239 return err;
1240 }
1241
mlx5e_cleanup_rep_tx(struct mlx5e_priv * priv)1242 static void mlx5e_cleanup_rep_tx(struct mlx5e_priv *priv)
1243 {
1244 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1245
1246 mlx5e_tc_ht_cleanup(&rpriv->tc_ht);
1247
1248 if (rpriv->rep->vport == MLX5_VPORT_UPLINK)
1249 mlx5e_cleanup_uplink_rep_tx(rpriv);
1250
1251 mlx5e_rep_neigh_cleanup(rpriv);
1252 }
1253
/* Profile ->enable() callback of mlx5e_rep_profile: only sets the netdev
 * MTU boundaries.
 */
static void mlx5e_rep_enable(struct mlx5e_priv *priv)
{
	mlx5e_set_netdev_mtu_boundaries(priv);
}
1258
/* Profile ->disable() callback of mlx5e_rep_profile: intentionally empty,
 * mlx5e_rep_enable() leaves nothing to undo.
 */
static void mlx5e_rep_disable(struct mlx5e_priv *priv)
{
}
1262
/* Profile ->update_rx() callback of both representor profiles: there is
 * nothing to update, so it always returns 0.
 */
static int mlx5e_update_rep_rx(struct mlx5e_priv *priv)
{
	return 0;
}
1267
/* Profile ->update_stats() callback of mlx5e_rep_profile: runs the common
 * ndo stats update and then refreshes the representor's vport queue
 * counter.
 */
static void mlx5e_rep_stats_update_ndo_stats(struct mlx5e_priv *priv)
{
	mlx5e_stats_update_ndo_stats(priv);
	mlx5e_rep_update_vport_q_counter(priv);
}
1273
mlx5e_rep_event_mpesw(struct mlx5e_priv * priv)1274 static int mlx5e_rep_event_mpesw(struct mlx5e_priv *priv)
1275 {
1276 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1277 struct mlx5_eswitch_rep *rep = rpriv->rep;
1278
1279 if (rep->vport != MLX5_VPORT_UPLINK)
1280 return NOTIFY_DONE;
1281
1282 queue_work(priv->wq, &rpriv->uplink_priv.mpesw_work);
1283
1284 return NOTIFY_OK;
1285 }
1286
uplink_rep_async_event(struct notifier_block * nb,unsigned long event,void * data)1287 static int uplink_rep_async_event(struct notifier_block *nb, unsigned long event, void *data)
1288 {
1289 struct mlx5e_priv *priv = container_of(nb, struct mlx5e_priv, events_nb);
1290
1291 if (event == MLX5_EVENT_TYPE_PORT_CHANGE) {
1292 struct mlx5_eqe *eqe = data;
1293
1294 switch (eqe->sub_type) {
1295 case MLX5_PORT_CHANGE_SUBTYPE_DOWN:
1296 case MLX5_PORT_CHANGE_SUBTYPE_ACTIVE:
1297 queue_work(priv->wq, &priv->update_carrier_work);
1298 break;
1299 default:
1300 return NOTIFY_DONE;
1301 }
1302
1303 return NOTIFY_OK;
1304 }
1305
1306 if (event == MLX5_DEV_EVENT_PORT_AFFINITY)
1307 return mlx5e_rep_tc_event_port_affinity(priv);
1308 else if (event == MLX5_DEV_EVENT_MULTIPORT_ESW)
1309 return mlx5e_rep_event_mpesw(priv);
1310
1311 return NOTIFY_DONE;
1312 }
1313
/* Profile ->enable() callback of mlx5e_uplink_rep_profile.
 *
 * Brings up the uplink-specific services (IPsec, MTU limits, TC, LAG,
 * async event notifier, DCB, bridge offload) and finally, under RTNL,
 * re-opens the netdev if it is running and attaches it.
 * mlx5e_uplink_rep_disable() is the counterpart.
 */
static void mlx5e_uplink_rep_enable(struct mlx5e_priv *priv)
{
	struct net_device *netdev = priv->netdev;
	struct mlx5_core_dev *mdev = priv->mdev;
	u16 max_mtu;

	mlx5e_ipsec_init(priv);

	/* MTU range: ETH_MIN_MTU up to the queried port maximum, converted
	 * from the HW value with MLX5E_HW2SW_MTU().
	 */
	netdev->min_mtu = ETH_MIN_MTU;
	mlx5_query_port_max_mtu(priv->mdev, &max_mtu, 1);
	netdev->max_mtu = MLX5E_HW2SW_MTU(&priv->channels.params, max_mtu);
	mlx5e_set_dev_port_mtu(priv);

	mlx5e_rep_tc_enable(priv);

	/* Only when the device reports the uplink_follow capability */
	if (MLX5_CAP_GEN(mdev, uplink_follow))
		mlx5_modify_vport_admin_state(mdev, MLX5_VPORT_STATE_OP_MOD_UPLINK,
					      0, 0, MLX5_VPORT_ADMIN_STATE_AUTO);
	mlx5_lag_add_netdev(mdev, netdev);
	/* Events are delivered to uplink_rep_async_event() from here on */
	priv->events_nb.notifier_call = uplink_rep_async_event;
	mlx5_notifier_register(mdev, &priv->events_nb);
	mlx5e_dcbnl_initialize(priv);
	mlx5e_dcbnl_init_app(priv);
	mlx5e_rep_bridge_init(priv);

	netdev->wanted_features |= NETIF_F_HW_TC;

	rtnl_lock();
	if (netif_running(netdev))
		mlx5e_open(netdev);
	udp_tunnel_nic_reset_ntf(priv->netdev);
	netif_device_attach(netdev);
	rtnl_unlock();
}
1348
/* Profile ->disable() callback of mlx5e_uplink_rep_profile; counterpart of
 * mlx5e_uplink_rep_enable().
 *
 * Closes (if running) and detaches the netdev under RTNL first, then shuts
 * down the uplink-specific services.
 */
static void mlx5e_uplink_rep_disable(struct mlx5e_priv *priv)
{
	struct mlx5_core_dev *mdev = priv->mdev;

	rtnl_lock();
	if (netif_running(priv->netdev))
		mlx5e_close(priv->netdev);
	netif_device_detach(priv->netdev);
	rtnl_unlock();

	mlx5e_rep_bridge_cleanup(priv);
	mlx5e_dcbnl_delete_app(priv);
	/* After this, uplink_rep_async_event() is no longer registered */
	mlx5_notifier_unregister(mdev, &priv->events_nb);
	mlx5e_rep_tc_disable(priv);
	mlx5_lag_remove_netdev(mdev, priv->netdev);
	mlx5_vxlan_reset_to_default(mdev->vxlan);

	mlx5e_ipsec_cleanup(priv);
}
1368
/* Stats groups defined in this file and referenced by mlx5e_rep_profile
 * through mlx5e_rep_stats_grps[].
 */
static MLX5E_DEFINE_STATS_GRP(sw_rep, 0);
static MLX5E_DEFINE_STATS_GRP(vport_rep, MLX5E_NDO_UPDATE_STATS);

/* The stats groups order is opposite to the update_stats() order calls */
static mlx5e_stats_grp_t mlx5e_rep_stats_grps[] = {
	&MLX5E_STATS_GRP(sw_rep),
	&MLX5E_STATS_GRP(vport_rep),
};
1377
/* Profile ->stats_grps_num() callback of mlx5e_rep_profile: number of
 * entries in mlx5e_rep_stats_grps[]. @priv is unused.
 */
static unsigned int mlx5e_rep_stats_grps_num(struct mlx5e_priv *priv)
{
	return ARRAY_SIZE(mlx5e_rep_stats_grps);
}
1382
/* Stats groups referenced by mlx5e_uplink_rep_profile. The two IPsec groups
 * are only present when CONFIG_MLX5_EN_IPSEC is defined.
 *
 * The stats groups order is opposite to the update_stats() order calls
 */
static mlx5e_stats_grp_t mlx5e_ul_rep_stats_grps[] = {
	&MLX5E_STATS_GRP(sw),
	&MLX5E_STATS_GRP(qcnt),
	&MLX5E_STATS_GRP(vnic_env),
	&MLX5E_STATS_GRP(vport),
	&MLX5E_STATS_GRP(802_3),
	&MLX5E_STATS_GRP(2863),
	&MLX5E_STATS_GRP(2819),
	&MLX5E_STATS_GRP(phy),
	&MLX5E_STATS_GRP(eth_ext),
	&MLX5E_STATS_GRP(pcie),
	&MLX5E_STATS_GRP(per_prio),
	&MLX5E_STATS_GRP(pme),
	&MLX5E_STATS_GRP(channels),
	&MLX5E_STATS_GRP(per_port_buff_congest),
#ifdef CONFIG_MLX5_EN_IPSEC
	&MLX5E_STATS_GRP(ipsec_hw),
	&MLX5E_STATS_GRP(ipsec_sw),
#endif
	&MLX5E_STATS_GRP(ptp),
};
1405
/* Profile ->stats_grps_num() callback of mlx5e_uplink_rep_profile: number
 * of entries in mlx5e_ul_rep_stats_grps[]. @priv is unused.
 */
static unsigned int mlx5e_ul_rep_stats_grps_num(struct mlx5e_priv *priv)
{
	return ARRAY_SIZE(mlx5e_ul_rep_stats_grps);
}
1410
1411 static int
mlx5e_rep_vnic_reporter_diagnose(struct devlink_health_reporter * reporter,struct devlink_fmsg * fmsg,struct netlink_ext_ack * extack)1412 mlx5e_rep_vnic_reporter_diagnose(struct devlink_health_reporter *reporter,
1413 struct devlink_fmsg *fmsg,
1414 struct netlink_ext_ack *extack)
1415 {
1416 struct mlx5e_rep_priv *rpriv = devlink_health_reporter_priv(reporter);
1417 struct mlx5_eswitch_rep *rep = rpriv->rep;
1418
1419 mlx5_reporter_vnic_diagnose_counters(rep->esw->dev, fmsg, rep->vport,
1420 true);
1421 return 0;
1422 }
1423
/* Ops of the per-representor "vnic" devlink health reporter; only a
 * diagnose callback is provided.
 */
static const struct devlink_health_reporter_ops mlx5_rep_vnic_reporter_ops = {
	.name = "vnic",
	.diagnose = mlx5e_rep_vnic_reporter_diagnose,
};
1428
mlx5e_rep_vnic_reporter_create(struct mlx5e_priv * priv,struct devlink_port * dl_port)1429 static void mlx5e_rep_vnic_reporter_create(struct mlx5e_priv *priv,
1430 struct devlink_port *dl_port)
1431 {
1432 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1433 struct devlink_health_reporter *reporter;
1434
1435 reporter = devl_port_health_reporter_create(dl_port,
1436 &mlx5_rep_vnic_reporter_ops,
1437 0, rpriv);
1438 if (IS_ERR(reporter)) {
1439 mlx5_core_err(priv->mdev,
1440 "Failed to create representor vnic reporter, err = %ld\n",
1441 PTR_ERR(reporter));
1442 return;
1443 }
1444
1445 rpriv->rep_vnic_reporter = reporter;
1446 }
1447
mlx5e_rep_vnic_reporter_destroy(struct mlx5e_priv * priv)1448 static void mlx5e_rep_vnic_reporter_destroy(struct mlx5e_priv *priv)
1449 {
1450 struct mlx5e_rep_priv *rpriv = priv->ppriv;
1451
1452 if (!IS_ERR_OR_NULL(rpriv->rep_vnic_reporter))
1453 devl_health_reporter_destroy(rpriv->rep_vnic_reporter);
1454 }
1455
/* Profile used for the representor netdevs created by
 * mlx5e_vport_vf_rep_load(), i.e. every representor except the uplink.
 * Limited to a single traffic class.
 */
static const struct mlx5e_profile mlx5e_rep_profile = {
	.init			= mlx5e_init_rep,
	.cleanup		= mlx5e_cleanup_rep,
	.init_rx		= mlx5e_init_rep_rx,
	.cleanup_rx		= mlx5e_cleanup_rep_rx,
	.init_tx		= mlx5e_init_rep_tx,
	.cleanup_tx		= mlx5e_cleanup_rep_tx,
	.enable			= mlx5e_rep_enable,
	.disable		= mlx5e_rep_disable,
	.update_rx		= mlx5e_update_rep_rx,
	.update_stats           = mlx5e_rep_stats_update_ndo_stats,
	.rx_handlers            = &mlx5e_rx_handlers_rep,
	.max_tc			= 1,
	.stats_grps		= mlx5e_rep_stats_grps,
	.stats_grps_num		= mlx5e_rep_stats_grps_num,
	.max_nch_limit		= mlx5e_rep_max_nch_limit,
};
1473
/* Profile the uplink netdev is switched to by
 * mlx5e_vport_uplink_rep_load(). It shares the cleanup, TX and update_rx
 * callbacks with mlx5e_rep_profile but has its own init, RX, enable/disable,
 * carrier update and stats groups, and allows MLX5_MAX_NUM_TC traffic
 * classes.
 */
static const struct mlx5e_profile mlx5e_uplink_rep_profile = {
	.init			= mlx5e_init_ul_rep,
	.cleanup		= mlx5e_cleanup_rep,
	.init_rx		= mlx5e_init_ul_rep_rx,
	.cleanup_rx		= mlx5e_cleanup_ul_rep_rx,
	.init_tx		= mlx5e_init_rep_tx,
	.cleanup_tx		= mlx5e_cleanup_rep_tx,
	.enable		        = mlx5e_uplink_rep_enable,
	.disable	        = mlx5e_uplink_rep_disable,
	.update_rx		= mlx5e_update_rep_rx,
	.update_stats           = mlx5e_stats_update_ndo_stats,
	.update_carrier	        = mlx5e_update_carrier,
	.rx_handlers            = &mlx5e_rx_handlers_rep,
	.max_tc			= MLX5_MAX_NUM_TC,
	.stats_grps		= mlx5e_ul_rep_stats_grps,
	.stats_grps_num		= mlx5e_ul_rep_stats_grps_num,
};
1491
1492 /* e-Switch vport representors */
1493 static int
mlx5e_vport_uplink_rep_load(struct mlx5_core_dev * dev,struct mlx5_eswitch_rep * rep)1494 mlx5e_vport_uplink_rep_load(struct mlx5_core_dev *dev, struct mlx5_eswitch_rep *rep)
1495 {
1496 struct mlx5e_priv *priv = netdev_priv(mlx5_uplink_netdev_get(dev));
1497 struct mlx5e_rep_priv *rpriv = mlx5e_rep_to_rep_priv(rep);
1498
1499 rpriv->netdev = priv->netdev;
1500 return mlx5e_netdev_change_profile(priv, &mlx5e_uplink_rep_profile,
1501 rpriv);
1502 }
1503
1504 static void
mlx5e_vport_uplink_rep_unload(struct mlx5e_rep_priv * rpriv)1505 mlx5e_vport_uplink_rep_unload(struct mlx5e_rep_priv *rpriv)
1506 {
1507 struct net_device *netdev = rpriv->netdev;
1508 struct mlx5e_priv *priv;
1509
1510 priv = netdev_priv(netdev);
1511
1512 /* This bit is set when using devlink to change eswitch mode from
1513 * switchdev to legacy. As need to keep uplink netdev ifindex, we
1514 * detach uplink representor profile and attach NIC profile only.
1515 * The netdev will be unregistered later when unload NIC auxiliary
1516 * driver for this case.
1517 * We explicitly block devlink eswitch mode change if any IPSec rules
1518 * offloaded, but can't block other cases, such as driver unload
1519 * and devlink reload. We have to unregister netdev before profile
1520 * change for those cases. This is to avoid resource leak because
1521 * the offloaded rules don't have the chance to be unoffloaded before
1522 * cleanup which is triggered by detach uplink representor profile.
1523 */
1524 if (!(priv->mdev->priv.flags & MLX5_PRIV_FLAGS_SWITCH_LEGACY))
1525 unregister_netdev(netdev);
1526
1527 mlx5e_netdev_attach_nic_profile(priv);
1528 }
1529
/* Load a non-uplink representor: create a netdev with mlx5e_rep_profile,
 * initialize and attach it, link it to its devlink port (when one exists)
 * and register it.
 *
 * On failure every completed step is undone in reverse order.
 *
 * Returns 0 on success, -EINVAL when the netdev cannot be created, or the
 * errno of the failing step.
 */
static int
mlx5e_vport_vf_rep_load(struct mlx5_core_dev *dev, struct mlx5_eswitch_rep *rep)
{
	struct mlx5e_rep_priv *rpriv = mlx5e_rep_to_rep_priv(rep);
	const struct mlx5e_profile *profile;
	struct devlink_port *dl_port;
	struct net_device *netdev;
	struct mlx5e_priv *priv;
	int err;

	profile = &mlx5e_rep_profile;
	netdev = mlx5e_create_netdev(dev, profile);
	if (!netdev) {
		mlx5_core_warn(dev,
			       "Failed to create representor netdev for vport %d\n",
			       rep->vport);
		return -EINVAL;
	}

	mlx5e_build_rep_netdev(netdev, dev);
	rpriv->netdev = netdev;

	/* profile and ppriv are set before ->init() is invoked below */
	priv = netdev_priv(netdev);
	priv->profile = profile;
	priv->ppriv = rpriv;
	err = profile->init(dev, netdev);
	if (err) {
		netdev_warn(netdev, "rep profile init failed, %d\n", err);
		goto err_destroy_netdev;
	}

	err = mlx5e_attach_netdev(netdev_priv(netdev));
	if (err) {
		netdev_warn(netdev,
			    "Failed to attach representor netdev for vport %d\n",
			    rep->vport);
		goto err_cleanup_profile;
	}

	/* A missing devlink port is not an error: the netdev is then
	 * registered without a port link and without a vnic reporter.
	 */
	dl_port = mlx5_esw_offloads_devlink_port(dev->priv.eswitch,
						 rpriv->rep->vport);
	if (!IS_ERR(dl_port)) {
		SET_NETDEV_DEVLINK_PORT(netdev, dl_port);
		mlx5e_rep_vnic_reporter_create(priv, dl_port);
	}

	err = register_netdev(netdev);
	if (err) {
		netdev_warn(netdev,
			    "Failed to register representor netdev for vport %d\n",
			    rep->vport);
		goto err_detach_netdev;
	}

	return 0;

err_detach_netdev:
	mlx5e_rep_vnic_reporter_destroy(priv);
	mlx5e_detach_netdev(netdev_priv(netdev));
err_cleanup_profile:
	priv->profile->cleanup(priv);

err_destroy_netdev:
	mlx5e_destroy_netdev(netdev_priv(netdev));
	return err;
}
1596
1597 static int
mlx5e_vport_rep_load(struct mlx5_core_dev * dev,struct mlx5_eswitch_rep * rep)1598 mlx5e_vport_rep_load(struct mlx5_core_dev *dev, struct mlx5_eswitch_rep *rep)
1599 {
1600 struct mlx5e_rep_priv *rpriv;
1601 int err;
1602
1603 rpriv = kvzalloc(sizeof(*rpriv), GFP_KERNEL);
1604 if (!rpriv)
1605 return -ENOMEM;
1606
1607 /* rpriv->rep to be looked up when profile->init() is called */
1608 rpriv->rep = rep;
1609 rep->rep_data[REP_ETH].priv = rpriv;
1610 INIT_LIST_HEAD(&rpriv->vport_sqs_list);
1611
1612 if (rep->vport == MLX5_VPORT_UPLINK)
1613 err = mlx5e_vport_uplink_rep_load(dev, rep);
1614 else
1615 err = mlx5e_vport_vf_rep_load(dev, rep);
1616
1617 if (err)
1618 kvfree(rpriv);
1619
1620 return err;
1621 }
1622
/* ->unload() callback of rep_ops; counterpart of mlx5e_vport_rep_load().
 *
 * The uplink representor only gives its netdev back to the NIC profile.
 * Every other representor is unregistered, detached, cleaned up and its
 * netdev destroyed. In both cases the private data is freed last.
 */
static void
mlx5e_vport_rep_unload(struct mlx5_eswitch_rep *rep)
{
	struct mlx5e_rep_priv *rpriv = mlx5e_rep_to_rep_priv(rep);
	struct net_device *netdev = rpriv->netdev;
	struct mlx5e_priv *priv = netdev_priv(netdev);
	/* Captured up front: priv is not read again after the teardown below.
	 * NOTE(review): presumably priv is no longer valid (or priv->ppriv no
	 * longer points at rpriv) once the teardown has run - confirm.
	 */
	void *ppriv = priv->ppriv;

	if (rep->vport == MLX5_VPORT_UPLINK) {
		mlx5e_vport_uplink_rep_unload(rpriv);
		goto free_ppriv;
	}

	/* Reverse of mlx5e_vport_vf_rep_load() */
	unregister_netdev(netdev);
	mlx5e_rep_vnic_reporter_destroy(priv);
	mlx5e_detach_netdev(priv);
	priv->profile->cleanup(priv);
	mlx5e_destroy_netdev(priv);
free_ppriv:
	kvfree(ppriv); /* mlx5e_rep_priv */
}
1644
mlx5e_vport_rep_get_proto_dev(struct mlx5_eswitch_rep * rep)1645 static void *mlx5e_vport_rep_get_proto_dev(struct mlx5_eswitch_rep *rep)
1646 {
1647 struct mlx5e_rep_priv *rpriv;
1648
1649 rpriv = mlx5e_rep_to_rep_priv(rep);
1650
1651 return rpriv->netdev;
1652 }
1653
mlx5e_vport_rep_event_unpair(struct mlx5_eswitch_rep * rep,struct mlx5_eswitch * peer_esw)1654 static void mlx5e_vport_rep_event_unpair(struct mlx5_eswitch_rep *rep,
1655 struct mlx5_eswitch *peer_esw)
1656 {
1657 u16 i = MLX5_CAP_GEN(peer_esw->dev, vhca_id);
1658 struct mlx5e_rep_priv *rpriv;
1659 struct mlx5e_rep_sq *rep_sq;
1660
1661 WARN_ON_ONCE(!peer_esw);
1662 rpriv = mlx5e_rep_to_rep_priv(rep);
1663 list_for_each_entry(rep_sq, &rpriv->vport_sqs_list, list) {
1664 struct mlx5e_rep_sq_peer *sq_peer = xa_load(&rep_sq->sq_peer, i);
1665
1666 if (!sq_peer || sq_peer->peer != peer_esw)
1667 continue;
1668
1669 mlx5_eswitch_del_send_to_vport_rule(sq_peer->rule);
1670 xa_erase(&rep_sq->sq_peer, i);
1671 kfree(sq_peer);
1672 }
1673 }
1674
/* Handle MLX5_SWITCHDEV_EVENT_PAIR for @rep.
 *
 * For every send queue of the representor that is not yet paired with a
 * peer under the peer's vhca_id, add a send-to-vport rule on @peer_esw and
 * record it in the SQ's peer xarray. An existing entry without a peer is
 * reused; otherwise a new entry is allocated and inserted.
 *
 * On any failure the whole pairing is rolled back through
 * mlx5e_vport_rep_event_unpair().
 *
 * Returns 0 on success or a negative errno.
 */
static int mlx5e_vport_rep_event_pair(struct mlx5_eswitch *esw,
				      struct mlx5_eswitch_rep *rep,
				      struct mlx5_eswitch *peer_esw)
{
	u16 i = MLX5_CAP_GEN(peer_esw->dev, vhca_id);
	struct mlx5_flow_handle *flow_rule;
	struct mlx5e_rep_sq_peer *sq_peer;
	struct mlx5e_rep_priv *rpriv;
	struct mlx5e_rep_sq *rep_sq;
	int err;

	rpriv = mlx5e_rep_to_rep_priv(rep);
	list_for_each_entry(rep_sq, &rpriv->vport_sqs_list, list) {
		sq_peer = xa_load(&rep_sq->sq_peer, i);

		/* Already paired under this vhca_id: nothing to do for this SQ */
		if (sq_peer && sq_peer->peer)
			continue;

		flow_rule = mlx5_eswitch_add_send_to_vport_rule(peer_esw, esw, rep,
								rep_sq->sqn);
		if (IS_ERR(flow_rule)) {
			err = PTR_ERR(flow_rule);
			goto err_out;
		}

		/* An entry exists but has no peer yet: just fill it in */
		if (sq_peer) {
			sq_peer->rule = flow_rule;
			sq_peer->peer = peer_esw;
			continue;
		}
		sq_peer = kzalloc(sizeof(*sq_peer), GFP_KERNEL);
		if (!sq_peer) {
			err = -ENOMEM;
			goto err_sq_alloc;
		}
		err = xa_insert(&rep_sq->sq_peer, i, sq_peer, GFP_KERNEL);
		if (err)
			goto err_xa;
		sq_peer->rule = flow_rule;
		sq_peer->peer = peer_esw;
	}

	return 0;
err_xa:
	/* The entry never made it into the xarray, free it directly */
	kfree(sq_peer);
err_sq_alloc:
	/* The rule of the failing SQ is not recorded anywhere yet */
	mlx5_eswitch_del_send_to_vport_rule(flow_rule);
err_out:
	/* Undo the SQs that were paired in earlier iterations */
	mlx5e_vport_rep_event_unpair(rep, peer_esw);
	return err;
}
1726
mlx5e_vport_rep_event(struct mlx5_eswitch * esw,struct mlx5_eswitch_rep * rep,enum mlx5_switchdev_event event,void * data)1727 static int mlx5e_vport_rep_event(struct mlx5_eswitch *esw,
1728 struct mlx5_eswitch_rep *rep,
1729 enum mlx5_switchdev_event event,
1730 void *data)
1731 {
1732 int err = 0;
1733
1734 if (event == MLX5_SWITCHDEV_EVENT_PAIR)
1735 err = mlx5e_vport_rep_event_pair(esw, rep, data);
1736 else if (event == MLX5_SWITCHDEV_EVENT_UNPAIR)
1737 mlx5e_vport_rep_event_unpair(rep, data);
1738
1739 return err;
1740 }
1741
/* Representor callbacks registered for REP_ETH by mlx5e_rep_probe() */
static const struct mlx5_eswitch_rep_ops rep_ops = {
	.load = mlx5e_vport_rep_load,
	.unload = mlx5e_vport_rep_unload,
	.get_proto_dev = mlx5e_vport_rep_get_proto_dev,
	.event = mlx5e_vport_rep_event,
};
1748
mlx5e_rep_probe(struct auxiliary_device * adev,const struct auxiliary_device_id * id)1749 static int mlx5e_rep_probe(struct auxiliary_device *adev,
1750 const struct auxiliary_device_id *id)
1751 {
1752 struct mlx5_adev *edev = container_of(adev, struct mlx5_adev, adev);
1753 struct mlx5_core_dev *mdev = edev->mdev;
1754 struct mlx5_eswitch *esw;
1755
1756 esw = mdev->priv.eswitch;
1757 mlx5_eswitch_register_vport_reps(esw, &rep_ops, REP_ETH);
1758 return 0;
1759 }
1760
mlx5e_rep_remove(struct auxiliary_device * adev)1761 static void mlx5e_rep_remove(struct auxiliary_device *adev)
1762 {
1763 struct mlx5_adev *vdev = container_of(adev, struct mlx5_adev, adev);
1764 struct mlx5_core_dev *mdev = vdev->mdev;
1765 struct mlx5_eswitch *esw;
1766
1767 esw = mdev->priv.eswitch;
1768 mlx5_eswitch_unregister_vport_reps(esw, REP_ETH);
1769 }
1770
/* Auxiliary device IDs this driver binds to: the "eth-rep" device of the
 * mlx5 auxiliary bus. The empty entry terminates the table.
 */
static const struct auxiliary_device_id mlx5e_rep_id_table[] = {
	{ .name = MLX5_ADEV_NAME ".eth-rep", },
	{},
};

MODULE_DEVICE_TABLE(auxiliary, mlx5e_rep_id_table);
1777
/* Auxiliary driver for the Ethernet representors; registered and
 * unregistered by mlx5e_rep_init() / mlx5e_rep_cleanup().
 */
static struct auxiliary_driver mlx5e_rep_driver = {
	.name = "eth-rep",
	.probe = mlx5e_rep_probe,
	.remove = mlx5e_rep_remove,
	.id_table = mlx5e_rep_id_table,
};
1784
/* Register the representor auxiliary driver.
 * Returns the result of auxiliary_driver_register().
 */
int mlx5e_rep_init(void)
{
	return auxiliary_driver_register(&mlx5e_rep_driver);
}
1789
/* Unregister the representor auxiliary driver; counterpart of
 * mlx5e_rep_init().
 */
void mlx5e_rep_cleanup(void)
{
	auxiliary_driver_unregister(&mlx5e_rep_driver);
}
1794