1 /* 2 * Copyright (C) 2016-2018 Netronome Systems, Inc. 3 * 4 * This software is dual licensed under the GNU General License Version 2, 5 * June 1991 as shown in the file COPYING in the top-level directory of this 6 * source tree or the BSD 2-Clause License provided below. You have the 7 * option to license this software under the complete terms of either license. 8 * 9 * The BSD 2-Clause License: 10 * 11 * Redistribution and use in source and binary forms, with or 12 * without modification, are permitted provided that the following 13 * conditions are met: 14 * 15 * 1. Redistributions of source code must retain the above 16 * copyright notice, this list of conditions and the following 17 * disclaimer. 18 * 19 * 2. Redistributions in binary form must reproduce the above 20 * copyright notice, this list of conditions and the following 21 * disclaimer in the documentation and/or other materials 22 * provided with the distribution. 23 * 24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 31 * SOFTWARE. 32 */ 33 34 /* 35 * nfp_net_offload.c 36 * Netronome network device driver: TC offload functions for PF and VF 37 */ 38 39 #define pr_fmt(fmt) "NFP net bpf: " fmt 40 41 #include <linux/bpf.h> 42 #include <linux/kernel.h> 43 #include <linux/netdevice.h> 44 #include <linux/pci.h> 45 #include <linux/jiffies.h> 46 #include <linux/timer.h> 47 #include <linux/list.h> 48 #include <linux/mm.h> 49 50 #include <net/pkt_cls.h> 51 #include <net/tc_act/tc_gact.h> 52 #include <net/tc_act/tc_mirred.h> 53 54 #include "main.h" 55 #include "../nfp_app.h" 56 #include "../nfp_net_ctrl.h" 57 #include "../nfp_net.h" 58 59 static int 60 nfp_map_ptr_record(struct nfp_app_bpf *bpf, struct nfp_prog *nfp_prog, 61 struct bpf_map *map) 62 { 63 struct nfp_bpf_neutral_map *record; 64 int err; 65 66 /* Map record paths are entered via ndo, update side is protected. */ 67 ASSERT_RTNL(); 68 69 /* Reuse path - other offloaded program is already tracking this map. */ 70 record = rhashtable_lookup_fast(&bpf->maps_neutral, &map->id, 71 nfp_bpf_maps_neutral_params); 72 if (record) { 73 nfp_prog->map_records[nfp_prog->map_records_cnt++] = record; 74 record->count++; 75 return 0; 76 } 77 78 /* Grab a single ref to the map for our record. The prog destroy ndo 79 * happens after free_used_maps(). 80 */ 81 map = bpf_map_inc(map, false); 82 if (IS_ERR(map)) 83 return PTR_ERR(map); 84 85 record = kmalloc(sizeof(*record), GFP_KERNEL); 86 if (!record) { 87 err = -ENOMEM; 88 goto err_map_put; 89 } 90 91 record->ptr = map; 92 record->map_id = map->id; 93 record->count = 1; 94 95 err = rhashtable_insert_fast(&bpf->maps_neutral, &record->l, 96 nfp_bpf_maps_neutral_params); 97 if (err) 98 goto err_free_rec; 99 100 nfp_prog->map_records[nfp_prog->map_records_cnt++] = record; 101 102 return 0; 103 104 err_free_rec: 105 kfree(record); 106 err_map_put: 107 bpf_map_put(map); 108 return err; 109 } 110 111 static void 112 nfp_map_ptrs_forget(struct nfp_app_bpf *bpf, struct nfp_prog *nfp_prog) 113 { 114 bool freed = false; 115 int i; 116 117 ASSERT_RTNL(); 118 119 for (i = 0; i < nfp_prog->map_records_cnt; i++) { 120 if (--nfp_prog->map_records[i]->count) { 121 nfp_prog->map_records[i] = NULL; 122 continue; 123 } 124 125 WARN_ON(rhashtable_remove_fast(&bpf->maps_neutral, 126 &nfp_prog->map_records[i]->l, 127 nfp_bpf_maps_neutral_params)); 128 freed = true; 129 } 130 131 if (freed) { 132 synchronize_rcu(); 133 134 for (i = 0; i < nfp_prog->map_records_cnt; i++) 135 if (nfp_prog->map_records[i]) { 136 bpf_map_put(nfp_prog->map_records[i]->ptr); 137 kfree(nfp_prog->map_records[i]); 138 } 139 } 140 141 kfree(nfp_prog->map_records); 142 nfp_prog->map_records = NULL; 143 nfp_prog->map_records_cnt = 0; 144 } 145 146 static int 147 nfp_map_ptrs_record(struct nfp_app_bpf *bpf, struct nfp_prog *nfp_prog, 148 struct bpf_prog *prog) 149 { 150 int i, cnt, err; 151 152 /* Quickly count the maps we will have to remember */ 153 cnt = 0; 154 for (i = 0; i < prog->aux->used_map_cnt; i++) 155 if (bpf_map_offload_neutral(prog->aux->used_maps[i])) 156 cnt++; 157 if (!cnt) 158 return 0; 159 160 nfp_prog->map_records = kmalloc_array(cnt, 161 sizeof(nfp_prog->map_records[0]), 162 GFP_KERNEL); 163 if (!nfp_prog->map_records) 164 return -ENOMEM; 165 166 for (i = 0; i < prog->aux->used_map_cnt; i++) 167 if (bpf_map_offload_neutral(prog->aux->used_maps[i])) { 168 err = nfp_map_ptr_record(bpf, nfp_prog, 169 prog->aux->used_maps[i]); 170 if (err) { 171 nfp_map_ptrs_forget(bpf, nfp_prog); 172 return err; 173 } 174 } 175 WARN_ON(cnt != nfp_prog->map_records_cnt); 176 177 return 0; 178 } 179 180 static int 181 nfp_prog_prepare(struct nfp_prog *nfp_prog, const struct bpf_insn *prog, 182 unsigned int cnt) 183 { 184 struct nfp_insn_meta *meta; 185 unsigned int i; 186 187 for (i = 0; i < cnt; i++) { 188 meta = kzalloc(sizeof(*meta), GFP_KERNEL); 189 if (!meta) 190 return -ENOMEM; 191 192 meta->insn = prog[i]; 193 meta->n = i; 194 if (is_mbpf_alu(meta)) { 195 meta->umin_src = U64_MAX; 196 meta->umin_dst = U64_MAX; 197 } 198 199 list_add_tail(&meta->l, &nfp_prog->insns); 200 } 201 202 nfp_bpf_jit_prepare(nfp_prog, cnt); 203 204 return 0; 205 } 206 207 static void nfp_prog_free(struct nfp_prog *nfp_prog) 208 { 209 struct nfp_insn_meta *meta, *tmp; 210 211 kfree(nfp_prog->subprog); 212 213 list_for_each_entry_safe(meta, tmp, &nfp_prog->insns, l) { 214 list_del(&meta->l); 215 kfree(meta); 216 } 217 kfree(nfp_prog); 218 } 219 220 static int 221 nfp_bpf_verifier_prep(struct nfp_app *app, struct nfp_net *nn, 222 struct netdev_bpf *bpf) 223 { 224 struct bpf_prog *prog = bpf->verifier.prog; 225 struct nfp_prog *nfp_prog; 226 int ret; 227 228 nfp_prog = kzalloc(sizeof(*nfp_prog), GFP_KERNEL); 229 if (!nfp_prog) 230 return -ENOMEM; 231 prog->aux->offload->dev_priv = nfp_prog; 232 233 INIT_LIST_HEAD(&nfp_prog->insns); 234 nfp_prog->type = prog->type; 235 nfp_prog->bpf = app->priv; 236 237 ret = nfp_prog_prepare(nfp_prog, prog->insnsi, prog->len); 238 if (ret) 239 goto err_free; 240 241 nfp_prog->verifier_meta = nfp_prog_first_meta(nfp_prog); 242 bpf->verifier.ops = &nfp_bpf_analyzer_ops; 243 244 return 0; 245 246 err_free: 247 nfp_prog_free(nfp_prog); 248 249 return ret; 250 } 251 252 static int nfp_bpf_translate(struct nfp_net *nn, struct bpf_prog *prog) 253 { 254 struct nfp_prog *nfp_prog = prog->aux->offload->dev_priv; 255 unsigned int max_instr; 256 int err; 257 258 max_instr = nn_readw(nn, NFP_NET_CFG_BPF_MAX_LEN); 259 nfp_prog->__prog_alloc_len = max_instr * sizeof(u64); 260 261 nfp_prog->prog = kvmalloc(nfp_prog->__prog_alloc_len, GFP_KERNEL); 262 if (!nfp_prog->prog) 263 return -ENOMEM; 264 265 err = nfp_bpf_jit(nfp_prog); 266 if (err) 267 return err; 268 269 prog->aux->offload->jited_len = nfp_prog->prog_len * sizeof(u64); 270 prog->aux->offload->jited_image = nfp_prog->prog; 271 272 return nfp_map_ptrs_record(nfp_prog->bpf, nfp_prog, prog); 273 } 274 275 static int nfp_bpf_destroy(struct nfp_net *nn, struct bpf_prog *prog) 276 { 277 struct nfp_prog *nfp_prog = prog->aux->offload->dev_priv; 278 279 kvfree(nfp_prog->prog); 280 nfp_map_ptrs_forget(nfp_prog->bpf, nfp_prog); 281 nfp_prog_free(nfp_prog); 282 283 return 0; 284 } 285 286 /* Atomic engine requires values to be in big endian, we need to byte swap 287 * the value words used with xadd. 288 */ 289 static void nfp_map_bpf_byte_swap(struct nfp_bpf_map *nfp_map, void *value) 290 { 291 u32 *word = value; 292 unsigned int i; 293 294 for (i = 0; i < DIV_ROUND_UP(nfp_map->offmap->map.value_size, 4); i++) 295 if (nfp_map->use_map[i] == NFP_MAP_USE_ATOMIC_CNT) 296 word[i] = (__force u32)cpu_to_be32(word[i]); 297 } 298 299 static int 300 nfp_bpf_map_lookup_entry(struct bpf_offloaded_map *offmap, 301 void *key, void *value) 302 { 303 int err; 304 305 err = nfp_bpf_ctrl_lookup_entry(offmap, key, value); 306 if (err) 307 return err; 308 309 nfp_map_bpf_byte_swap(offmap->dev_priv, value); 310 return 0; 311 } 312 313 static int 314 nfp_bpf_map_update_entry(struct bpf_offloaded_map *offmap, 315 void *key, void *value, u64 flags) 316 { 317 nfp_map_bpf_byte_swap(offmap->dev_priv, value); 318 return nfp_bpf_ctrl_update_entry(offmap, key, value, flags); 319 } 320 321 static int 322 nfp_bpf_map_get_next_key(struct bpf_offloaded_map *offmap, 323 void *key, void *next_key) 324 { 325 if (!key) 326 return nfp_bpf_ctrl_getfirst_entry(offmap, next_key); 327 return nfp_bpf_ctrl_getnext_entry(offmap, key, next_key); 328 } 329 330 static int 331 nfp_bpf_map_delete_elem(struct bpf_offloaded_map *offmap, void *key) 332 { 333 if (offmap->map.map_type == BPF_MAP_TYPE_ARRAY) 334 return -EINVAL; 335 return nfp_bpf_ctrl_del_entry(offmap, key); 336 } 337 338 static const struct bpf_map_dev_ops nfp_bpf_map_ops = { 339 .map_get_next_key = nfp_bpf_map_get_next_key, 340 .map_lookup_elem = nfp_bpf_map_lookup_entry, 341 .map_update_elem = nfp_bpf_map_update_entry, 342 .map_delete_elem = nfp_bpf_map_delete_elem, 343 }; 344 345 static int 346 nfp_bpf_map_alloc(struct nfp_app_bpf *bpf, struct bpf_offloaded_map *offmap) 347 { 348 struct nfp_bpf_map *nfp_map; 349 unsigned int use_map_size; 350 long long int res; 351 352 if (!bpf->maps.types) 353 return -EOPNOTSUPP; 354 355 if (offmap->map.map_flags || 356 offmap->map.numa_node != NUMA_NO_NODE) { 357 pr_info("map flags are not supported\n"); 358 return -EINVAL; 359 } 360 361 if (!(bpf->maps.types & 1 << offmap->map.map_type)) { 362 pr_info("map type not supported\n"); 363 return -EOPNOTSUPP; 364 } 365 if (bpf->maps.max_maps == bpf->maps_in_use) { 366 pr_info("too many maps for a device\n"); 367 return -ENOMEM; 368 } 369 if (bpf->maps.max_elems - bpf->map_elems_in_use < 370 offmap->map.max_entries) { 371 pr_info("map with too many elements: %u, left: %u\n", 372 offmap->map.max_entries, 373 bpf->maps.max_elems - bpf->map_elems_in_use); 374 return -ENOMEM; 375 } 376 377 if (round_up(offmap->map.key_size, 8) + 378 round_up(offmap->map.value_size, 8) > bpf->maps.max_elem_sz) { 379 pr_info("map elements too large: %u, FW max element size (key+value): %u\n", 380 round_up(offmap->map.key_size, 8) + 381 round_up(offmap->map.value_size, 8), 382 bpf->maps.max_elem_sz); 383 return -ENOMEM; 384 } 385 if (offmap->map.key_size > bpf->maps.max_key_sz) { 386 pr_info("map key size %u, FW max is %u\n", 387 offmap->map.key_size, bpf->maps.max_key_sz); 388 return -ENOMEM; 389 } 390 if (offmap->map.value_size > bpf->maps.max_val_sz) { 391 pr_info("map value size %u, FW max is %u\n", 392 offmap->map.value_size, bpf->maps.max_val_sz); 393 return -ENOMEM; 394 } 395 396 use_map_size = DIV_ROUND_UP(offmap->map.value_size, 4) * 397 FIELD_SIZEOF(struct nfp_bpf_map, use_map[0]); 398 399 nfp_map = kzalloc(sizeof(*nfp_map) + use_map_size, GFP_USER); 400 if (!nfp_map) 401 return -ENOMEM; 402 403 offmap->dev_priv = nfp_map; 404 nfp_map->offmap = offmap; 405 nfp_map->bpf = bpf; 406 407 res = nfp_bpf_ctrl_alloc_map(bpf, &offmap->map); 408 if (res < 0) { 409 kfree(nfp_map); 410 return res; 411 } 412 413 nfp_map->tid = res; 414 offmap->dev_ops = &nfp_bpf_map_ops; 415 bpf->maps_in_use++; 416 bpf->map_elems_in_use += offmap->map.max_entries; 417 list_add_tail(&nfp_map->l, &bpf->map_list); 418 419 return 0; 420 } 421 422 static int 423 nfp_bpf_map_free(struct nfp_app_bpf *bpf, struct bpf_offloaded_map *offmap) 424 { 425 struct nfp_bpf_map *nfp_map = offmap->dev_priv; 426 427 nfp_bpf_ctrl_free_map(bpf, nfp_map); 428 list_del_init(&nfp_map->l); 429 bpf->map_elems_in_use -= offmap->map.max_entries; 430 bpf->maps_in_use--; 431 kfree(nfp_map); 432 433 return 0; 434 } 435 436 int nfp_ndo_bpf(struct nfp_app *app, struct nfp_net *nn, struct netdev_bpf *bpf) 437 { 438 switch (bpf->command) { 439 case BPF_OFFLOAD_VERIFIER_PREP: 440 return nfp_bpf_verifier_prep(app, nn, bpf); 441 case BPF_OFFLOAD_TRANSLATE: 442 return nfp_bpf_translate(nn, bpf->offload.prog); 443 case BPF_OFFLOAD_DESTROY: 444 return nfp_bpf_destroy(nn, bpf->offload.prog); 445 case BPF_OFFLOAD_MAP_ALLOC: 446 return nfp_bpf_map_alloc(app->priv, bpf->offmap); 447 case BPF_OFFLOAD_MAP_FREE: 448 return nfp_bpf_map_free(app->priv, bpf->offmap); 449 default: 450 return -EINVAL; 451 } 452 } 453 454 static unsigned long 455 nfp_bpf_perf_event_copy(void *dst, const void *src, 456 unsigned long off, unsigned long len) 457 { 458 memcpy(dst, src + off, len); 459 return 0; 460 } 461 462 int nfp_bpf_event_output(struct nfp_app_bpf *bpf, const void *data, 463 unsigned int len) 464 { 465 struct cmsg_bpf_event *cbe = (void *)data; 466 struct nfp_bpf_neutral_map *record; 467 u32 pkt_size, data_size, map_id; 468 u64 map_id_full; 469 470 if (len < sizeof(struct cmsg_bpf_event)) 471 return -EINVAL; 472 473 pkt_size = be32_to_cpu(cbe->pkt_size); 474 data_size = be32_to_cpu(cbe->data_size); 475 map_id_full = be64_to_cpu(cbe->map_ptr); 476 map_id = map_id_full; 477 478 if (len < sizeof(struct cmsg_bpf_event) + pkt_size + data_size) 479 return -EINVAL; 480 if (cbe->hdr.ver != CMSG_MAP_ABI_VERSION) 481 return -EINVAL; 482 483 rcu_read_lock(); 484 record = rhashtable_lookup_fast(&bpf->maps_neutral, &map_id, 485 nfp_bpf_maps_neutral_params); 486 if (!record || map_id_full > U32_MAX) { 487 rcu_read_unlock(); 488 cmsg_warn(bpf, "perf event: map id %lld (0x%llx) not recognized, dropping event\n", 489 map_id_full, map_id_full); 490 return -EINVAL; 491 } 492 493 bpf_event_output(record->ptr, be32_to_cpu(cbe->cpu_id), 494 &cbe->data[round_up(pkt_size, 4)], data_size, 495 cbe->data, pkt_size, nfp_bpf_perf_event_copy); 496 rcu_read_unlock(); 497 498 return 0; 499 } 500 501 static int 502 nfp_net_bpf_load(struct nfp_net *nn, struct bpf_prog *prog, 503 struct netlink_ext_ack *extack) 504 { 505 struct nfp_prog *nfp_prog = prog->aux->offload->dev_priv; 506 unsigned int max_mtu; 507 dma_addr_t dma_addr; 508 void *img; 509 int err; 510 511 max_mtu = nn_readb(nn, NFP_NET_CFG_BPF_INL_MTU) * 64 - 32; 512 if (max_mtu < nn->dp.netdev->mtu) { 513 NL_SET_ERR_MSG_MOD(extack, "BPF offload not supported with MTU larger than HW packet split boundary"); 514 return -EOPNOTSUPP; 515 } 516 517 img = nfp_bpf_relo_for_vnic(nfp_prog, nn->app_priv); 518 if (IS_ERR(img)) 519 return PTR_ERR(img); 520 521 dma_addr = dma_map_single(nn->dp.dev, img, 522 nfp_prog->prog_len * sizeof(u64), 523 DMA_TO_DEVICE); 524 if (dma_mapping_error(nn->dp.dev, dma_addr)) { 525 kfree(img); 526 return -ENOMEM; 527 } 528 529 nn_writew(nn, NFP_NET_CFG_BPF_SIZE, nfp_prog->prog_len); 530 nn_writeq(nn, NFP_NET_CFG_BPF_ADDR, dma_addr); 531 532 /* Load up the JITed code */ 533 err = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_BPF); 534 if (err) 535 NL_SET_ERR_MSG_MOD(extack, 536 "FW command error while loading BPF"); 537 538 dma_unmap_single(nn->dp.dev, dma_addr, nfp_prog->prog_len * sizeof(u64), 539 DMA_TO_DEVICE); 540 kfree(img); 541 542 return err; 543 } 544 545 static void 546 nfp_net_bpf_start(struct nfp_net *nn, struct netlink_ext_ack *extack) 547 { 548 int err; 549 550 /* Enable passing packets through BPF function */ 551 nn->dp.ctrl |= NFP_NET_CFG_CTRL_BPF; 552 nn_writel(nn, NFP_NET_CFG_CTRL, nn->dp.ctrl); 553 err = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_GEN); 554 if (err) 555 NL_SET_ERR_MSG_MOD(extack, 556 "FW command error while enabling BPF"); 557 } 558 559 static int nfp_net_bpf_stop(struct nfp_net *nn) 560 { 561 if (!(nn->dp.ctrl & NFP_NET_CFG_CTRL_BPF)) 562 return 0; 563 564 nn->dp.ctrl &= ~NFP_NET_CFG_CTRL_BPF; 565 nn_writel(nn, NFP_NET_CFG_CTRL, nn->dp.ctrl); 566 567 return nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_GEN); 568 } 569 570 int nfp_net_bpf_offload(struct nfp_net *nn, struct bpf_prog *prog, 571 bool old_prog, struct netlink_ext_ack *extack) 572 { 573 int err; 574 575 if (prog && !bpf_offload_dev_match(prog, nn->dp.netdev)) 576 return -EINVAL; 577 578 if (prog && old_prog) { 579 u8 cap; 580 581 cap = nn_readb(nn, NFP_NET_CFG_BPF_CAP); 582 if (!(cap & NFP_NET_BPF_CAP_RELO)) { 583 NL_SET_ERR_MSG_MOD(extack, 584 "FW does not support live reload"); 585 return -EBUSY; 586 } 587 } 588 589 /* Something else is loaded, different program type? */ 590 if (!old_prog && nn->dp.ctrl & NFP_NET_CFG_CTRL_BPF) 591 return -EBUSY; 592 593 if (old_prog && !prog) 594 return nfp_net_bpf_stop(nn); 595 596 err = nfp_net_bpf_load(nn, prog, extack); 597 if (err) 598 return err; 599 600 if (!old_prog) 601 nfp_net_bpf_start(nn, extack); 602 603 return 0; 604 } 605