// SPDX-License-Identifier: (GPL-2.0-only OR BSD-2-Clause)
/* Copyright (C) 2016-2018 Netronome Systems, Inc. */

/*
 * nfp_net_offload.c
 * Netronome network device driver: BPF offload functions for PF and VF
 */

#define pr_fmt(fmt)	"NFP net bpf: " fmt

#include <linux/bpf.h>
#include <linux/kernel.h>
#include <linux/netdevice.h>
#include <linux/pci.h>
#include <linux/jiffies.h>
#include <linux/timer.h>
#include <linux/list.h>
#include <linux/mm.h>

#include <net/pkt_cls.h>
#include <net/tc_act/tc_gact.h>
#include <net/tc_act/tc_mirred.h>

#include "main.h"
#include "../nfp_app.h"
#include "../nfp_net_ctrl.h"
#include "../nfp_net.h"

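/* Maps used for perf event output are not offloaded to the device; they
 * stay on the host ("offload neutral") and are tracked per nfp_app_bpf in
 * the maps_neutral rhashtable, keyed by map ID, with one reference-counted
 * record shared by all offloaded programs using the map.  This is what lets
 * nfp_bpf_event_output() below match FW events back to a host map.
 */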
static int
nfp_map_ptr_record(struct nfp_app_bpf *bpf, struct nfp_prog *nfp_prog,
		   struct bpf_map *map)
{
	struct nfp_bpf_neutral_map *record;
	int err;

	/* Reuse path - other offloaded program is already tracking this map. */
	record = rhashtable_lookup_fast(&bpf->maps_neutral, &map->id,
					nfp_bpf_maps_neutral_params);
	if (record) {
		nfp_prog->map_records[nfp_prog->map_records_cnt++] = record;
		record->count++;
		return 0;
	}

	/* Grab a single ref to the map for our record.  The prog destroy ndo
	 * happens after free_used_maps().
	 */
	map = bpf_map_inc(map, false);
	if (IS_ERR(map))
		return PTR_ERR(map);

	record = kmalloc(sizeof(*record), GFP_KERNEL);
	if (!record) {
		err = -ENOMEM;
		goto err_map_put;
	}

	record->ptr = map;
	record->map_id = map->id;
	record->count = 1;

	err = rhashtable_insert_fast(&bpf->maps_neutral, &record->l,
				     nfp_bpf_maps_neutral_params);
	if (err)
		goto err_free;

	nfp_prog->map_records[nfp_prog->map_records_cnt++] = record;

	return 0;

err_free:
	kfree(record);
err_map_put:
	bpf_map_put(map);
	return err;
}

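/* Note: records are unhashed first and only freed after synchronize_rcu(),
 * since the event output path looks them up under rcu_read_lock() without
 * taking any lock that would serialize against this function.
 */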
static void
nfp_map_ptrs_forget(struct nfp_app_bpf *bpf, struct nfp_prog *nfp_prog)
{
	bool freed = false;
	int i;

	for (i = 0; i < nfp_prog->map_records_cnt; i++) {
		if (--nfp_prog->map_records[i]->count) {
			nfp_prog->map_records[i] = NULL;
			continue;
		}

		WARN_ON(rhashtable_remove_fast(&bpf->maps_neutral,
					       &nfp_prog->map_records[i]->l,
					       nfp_bpf_maps_neutral_params));
		freed = true;
	}

	if (freed) {
		synchronize_rcu();

		for (i = 0; i < nfp_prog->map_records_cnt; i++)
			if (nfp_prog->map_records[i]) {
				bpf_map_put(nfp_prog->map_records[i]->ptr);
				kfree(nfp_prog->map_records[i]);
			}
	}

	kfree(nfp_prog->map_records);
	nfp_prog->map_records = NULL;
	nfp_prog->map_records_cnt = 0;
}

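/* Count the offload-neutral maps up front so the record array can be
 * allocated in one go; nfp_map_ptr_record() then fills it incrementally.
 */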
static int
nfp_map_ptrs_record(struct nfp_app_bpf *bpf, struct nfp_prog *nfp_prog,
		    struct bpf_prog *prog)
{
	int i, cnt, err;

	/* Quickly count the maps we will have to remember */
	cnt = 0;
	for (i = 0; i < prog->aux->used_map_cnt; i++)
		if (bpf_map_offload_neutral(prog->aux->used_maps[i]))
			cnt++;
	if (!cnt)
		return 0;

	nfp_prog->map_records = kmalloc_array(cnt,
					      sizeof(nfp_prog->map_records[0]),
					      GFP_KERNEL);
	if (!nfp_prog->map_records)
		return -ENOMEM;

	for (i = 0; i < prog->aux->used_map_cnt; i++)
		if (bpf_map_offload_neutral(prog->aux->used_maps[i])) {
			err = nfp_map_ptr_record(bpf, nfp_prog,
						 prog->aux->used_maps[i]);
			if (err) {
				nfp_map_ptrs_forget(bpf, nfp_prog);
				return err;
			}
		}
	WARN_ON(cnt != nfp_prog->map_records_cnt);

	return 0;
}

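/* Translation state is kept as a list of nfp_insn_meta, one per eBPF
 * instruction.  umin_src/umin_dst start at U64_MAX, i.e. "no range known
 * yet"; the verifier callbacks narrow them from register state before
 * code generation.
 */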
static int
nfp_prog_prepare(struct nfp_prog *nfp_prog, const struct bpf_insn *prog,
		 unsigned int cnt)
{
	struct nfp_insn_meta *meta;
	unsigned int i;

	for (i = 0; i < cnt; i++) {
		meta = kzalloc(sizeof(*meta), GFP_KERNEL);
		if (!meta)
			return -ENOMEM;

		meta->insn = prog[i];
		meta->n = i;
		if (is_mbpf_alu(meta)) {
			meta->umin_src = U64_MAX;
			meta->umin_dst = U64_MAX;
		}

		list_add_tail(&meta->l, &nfp_prog->insns);
	}

	nfp_bpf_jit_prepare(nfp_prog, cnt);

	return 0;
}

static void nfp_prog_free(struct nfp_prog *nfp_prog)
{
	struct nfp_insn_meta *meta, *tmp;

	kfree(nfp_prog->subprog);

	list_for_each_entry_safe(meta, tmp, &nfp_prog->insns, l) {
		list_del(&meta->l);
		kfree(meta);
	}
	kfree(nfp_prog);
}

static int
nfp_bpf_verifier_prep(struct net_device *netdev, struct bpf_verifier_env *env)
{
	struct nfp_net *nn = netdev_priv(netdev);
	struct bpf_prog *prog = env->prog;
	struct nfp_app *app = nn->app;
	struct nfp_prog *nfp_prog;
	int ret;

	nfp_prog = kzalloc(sizeof(*nfp_prog), GFP_KERNEL);
	if (!nfp_prog)
		return -ENOMEM;
	prog->aux->offload->dev_priv = nfp_prog;

	INIT_LIST_HEAD(&nfp_prog->insns);
	nfp_prog->type = prog->type;
	nfp_prog->bpf = app->priv;

	ret = nfp_prog_prepare(nfp_prog, prog->insnsi, prog->len);
	if (ret)
		goto err_free;

	nfp_prog->verifier_meta = nfp_prog_first_meta(nfp_prog);

	return 0;

err_free:
	nfp_prog_free(nfp_prog);

	return ret;
}

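/* The JIT buffer is sized from the FW-advertised maximum program length,
 * not the eBPF program length, since a single eBPF instruction may expand
 * into multiple NFP instructions.
 */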
static int nfp_bpf_translate(struct net_device *netdev, struct bpf_prog *prog)
{
	struct nfp_prog *nfp_prog = prog->aux->offload->dev_priv;
	struct nfp_net *nn = netdev_priv(netdev);
	unsigned int max_instr;
	int err;

	max_instr = nn_readw(nn, NFP_NET_CFG_BPF_MAX_LEN);
	nfp_prog->__prog_alloc_len = max_instr * sizeof(u64);

	nfp_prog->prog = kvmalloc(nfp_prog->__prog_alloc_len, GFP_KERNEL);
	if (!nfp_prog->prog)
		return -ENOMEM;

	err = nfp_bpf_jit(nfp_prog);
	if (err)
		return err;

	prog->aux->offload->jited_len = nfp_prog->prog_len * sizeof(u64);
	prog->aux->offload->jited_image = nfp_prog->prog;

	return nfp_map_ptrs_record(nfp_prog->bpf, nfp_prog, prog);
}

static int nfp_bpf_destroy(struct nfp_net *nn, struct bpf_prog *prog)
{
	struct nfp_prog *nfp_prog = prog->aux->offload->dev_priv;

	kvfree(nfp_prog->prog);
	nfp_map_ptrs_forget(nfp_prog->bpf, nfp_prog);
	nfp_prog_free(nfp_prog);

	return 0;
}

/* Atomic engine requires values to be in big endian, we need to byte swap
 * the value words used with xadd.
 */
static void nfp_map_bpf_byte_swap(struct nfp_bpf_map *nfp_map, void *value)
{
	u32 *word = value;
	unsigned int i;

	for (i = 0; i < DIV_ROUND_UP(nfp_map->offmap->map.value_size, 4); i++)
		if (nfp_map->use_map[i].type == NFP_MAP_USE_ATOMIC_CNT)
			word[i] = (__force u32)cpu_to_be32(word[i]);
}

/* Mark value as unsafely initialized in case it becomes atomic later
 * and we didn't byte swap something non-byte swap neutral.
 */
static void
nfp_map_bpf_byte_swap_record(struct nfp_bpf_map *nfp_map, void *value)
{
	u32 *word = value;
	unsigned int i;

	for (i = 0; i < DIV_ROUND_UP(nfp_map->offmap->map.value_size, 4); i++)
		if (nfp_map->use_map[i].type == NFP_MAP_UNUSED &&
		    word[i] != (__force u32)cpu_to_be32(word[i]))
			nfp_map->use_map[i].non_zero_update = 1;
}

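/* Worked example: a 12-byte value has three 32-bit words.  If only word 1
 * is used with xadd, updating { 0x01020304, 0x01020304, 0x01020304 } on a
 * little-endian host sends { 0x01020304, 0x04030201, 0x01020304 } to FW;
 * words 0 and 2 pass through unswapped.
 */
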
static int
nfp_bpf_map_lookup_entry(struct bpf_offloaded_map *offmap,
			 void *key, void *value)
{
	int err;

	err = nfp_bpf_ctrl_lookup_entry(offmap, key, value);
	if (err)
		return err;

	nfp_map_bpf_byte_swap(offmap->dev_priv, value);
	return 0;
}

static int
nfp_bpf_map_update_entry(struct bpf_offloaded_map *offmap,
			 void *key, void *value, u64 flags)
{
	nfp_map_bpf_byte_swap(offmap->dev_priv, value);
	nfp_map_bpf_byte_swap_record(offmap->dev_priv, value);
	return nfp_bpf_ctrl_update_entry(offmap, key, value, flags);
}

static int
nfp_bpf_map_get_next_key(struct bpf_offloaded_map *offmap,
			 void *key, void *next_key)
{
	if (!key)
		return nfp_bpf_ctrl_getfirst_entry(offmap, next_key);
	return nfp_bpf_ctrl_getnext_entry(offmap, key, next_key);
}

static int
nfp_bpf_map_delete_elem(struct bpf_offloaded_map *offmap, void *key)
{
	if (offmap->map.map_type == BPF_MAP_TYPE_ARRAY)
		return -EINVAL;
	return nfp_bpf_ctrl_del_entry(offmap, key);
}

static const struct bpf_map_dev_ops nfp_bpf_map_ops = {
	.map_get_next_key	= nfp_bpf_map_get_next_key,
	.map_lookup_elem	= nfp_bpf_map_lookup_entry,
	.map_update_elem	= nfp_bpf_map_update_entry,
	.map_delete_elem	= nfp_bpf_map_delete_elem,
};

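/* Map creation is validated against the capabilities the FW advertised at
 * probe time (bpf->maps): supported map types, device-wide map and element
 * budgets, and key/value size limits.  On success the FW returns a table
 * id which is kept in nfp_map->tid.
 */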
static int
nfp_bpf_map_alloc(struct nfp_app_bpf *bpf, struct bpf_offloaded_map *offmap)
{
	struct nfp_bpf_map *nfp_map;
	unsigned int use_map_size;
	long long int res;

	if (!bpf->maps.types)
		return -EOPNOTSUPP;

	if (offmap->map.map_flags ||
	    offmap->map.numa_node != NUMA_NO_NODE) {
		pr_info("map flags are not supported\n");
		return -EINVAL;
	}

	if (!(bpf->maps.types & 1 << offmap->map.map_type)) {
		pr_info("map type not supported\n");
		return -EOPNOTSUPP;
	}
	if (bpf->maps.max_maps == bpf->maps_in_use) {
		pr_info("too many maps for a device\n");
		return -ENOMEM;
	}
	if (bpf->maps.max_elems - bpf->map_elems_in_use <
	    offmap->map.max_entries) {
		pr_info("map with too many elements: %u, left: %u\n",
			offmap->map.max_entries,
			bpf->maps.max_elems - bpf->map_elems_in_use);
		return -ENOMEM;
	}

	if (round_up(offmap->map.key_size, 8) +
	    round_up(offmap->map.value_size, 8) > bpf->maps.max_elem_sz) {
		pr_info("map elements too large: %u, FW max element size (key+value): %u\n",
			round_up(offmap->map.key_size, 8) +
			round_up(offmap->map.value_size, 8),
			bpf->maps.max_elem_sz);
		return -ENOMEM;
	}
	if (offmap->map.key_size > bpf->maps.max_key_sz) {
		pr_info("map key size %u, FW max is %u\n",
			offmap->map.key_size, bpf->maps.max_key_sz);
		return -ENOMEM;
	}
	if (offmap->map.value_size > bpf->maps.max_val_sz) {
		pr_info("map value size %u, FW max is %u\n",
			offmap->map.value_size, bpf->maps.max_val_sz);
		return -ENOMEM;
	}

	use_map_size = DIV_ROUND_UP(offmap->map.value_size, 4) *
		       FIELD_SIZEOF(struct nfp_bpf_map, use_map[0]);

	nfp_map = kzalloc(sizeof(*nfp_map) + use_map_size, GFP_USER);
	if (!nfp_map)
		return -ENOMEM;

	offmap->dev_priv = nfp_map;
	nfp_map->offmap = offmap;
	nfp_map->bpf = bpf;

	res = nfp_bpf_ctrl_alloc_map(bpf, &offmap->map);
	if (res < 0) {
		kfree(nfp_map);
		return res;
	}

	nfp_map->tid = res;
	offmap->dev_ops = &nfp_bpf_map_ops;
	bpf->maps_in_use++;
	bpf->map_elems_in_use += offmap->map.max_entries;
	list_add_tail(&nfp_map->l, &bpf->map_list);

	return 0;
}

static int
nfp_bpf_map_free(struct nfp_app_bpf *bpf, struct bpf_offloaded_map *offmap)
{
	struct nfp_bpf_map *nfp_map = offmap->dev_priv;

	nfp_bpf_ctrl_free_map(bpf, nfp_map);
	list_del_init(&nfp_map->l);
	bpf->map_elems_in_use -= offmap->map.max_entries;
	bpf->maps_in_use--;
	kfree(nfp_map);

	return 0;
}

int nfp_ndo_bpf(struct nfp_app *app, struct nfp_net *nn, struct netdev_bpf *bpf)
{
	switch (bpf->command) {
	case BPF_OFFLOAD_DESTROY:
		return nfp_bpf_destroy(nn, bpf->offload.prog);
	case BPF_OFFLOAD_MAP_ALLOC:
		return nfp_bpf_map_alloc(app->priv, bpf->offmap);
	case BPF_OFFLOAD_MAP_FREE:
		return nfp_bpf_map_free(app->priv, bpf->offmap);
	default:
		return -EINVAL;
	}
}

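/* FW delivers perf events as control messages.  The cmsg_bpf_event layout
 * carries the originating map pointer (used as an ID here), the CPU, the
 * packet bytes and, starting at the next 4-byte boundary after them, the
 * user data passed to bpf_perf_event_output().
 */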
static unsigned long
nfp_bpf_perf_event_copy(void *dst, const void *src,
			unsigned long off, unsigned long len)
{
	memcpy(dst, src + off, len);
	return 0;
}

int nfp_bpf_event_output(struct nfp_app_bpf *bpf, const void *data,
			 unsigned int len)
{
	struct cmsg_bpf_event *cbe = (void *)data;
	struct nfp_bpf_neutral_map *record;
	u32 pkt_size, data_size, map_id;
	u64 map_id_full;

	if (len < sizeof(struct cmsg_bpf_event))
		return -EINVAL;

	pkt_size = be32_to_cpu(cbe->pkt_size);
	data_size = be32_to_cpu(cbe->data_size);
	map_id_full = be64_to_cpu(cbe->map_ptr);
	map_id = map_id_full;

	if (len < sizeof(struct cmsg_bpf_event) + pkt_size + data_size)
		return -EINVAL;
	if (cbe->hdr.ver != CMSG_MAP_ABI_VERSION)
		return -EINVAL;

	rcu_read_lock();
	record = rhashtable_lookup_fast(&bpf->maps_neutral, &map_id,
					nfp_bpf_maps_neutral_params);
	if (!record || map_id_full > U32_MAX) {
		rcu_read_unlock();
		cmsg_warn(bpf, "perf event: map id %lld (0x%llx) not recognized, dropping event\n",
			  map_id_full, map_id_full);
		return -EINVAL;
	}

	bpf_event_output(record->ptr, be32_to_cpu(cbe->cpu_id),
			 &cbe->data[round_up(pkt_size, 4)], data_size,
			 cbe->data, pkt_size, nfp_bpf_perf_event_copy);

	rcu_read_unlock();

	return 0;
}

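/* Program load sequence: DMA-map the relocated image, write its address
 * and length to the BPF config registers, then ask FW to fetch it via an
 * NFP_NET_CFG_UPDATE_BPF reconfig.  The image buffer is unmapped and freed
 * as soon as the reconfig completes, so the FW presumably keeps its own
 * copy of the code.
 */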
static int
nfp_net_bpf_load(struct nfp_net *nn, struct bpf_prog *prog,
		 struct netlink_ext_ack *extack)
{
	struct nfp_prog *nfp_prog = prog->aux->offload->dev_priv;
	unsigned int fw_mtu, pkt_off, max_stack, max_prog_len;
	dma_addr_t dma_addr;
	void *img;
	int err;

	fw_mtu = nn_readb(nn, NFP_NET_CFG_BPF_INL_MTU) * 64 - 32;
	pkt_off = min(prog->aux->max_pkt_offset, nn->dp.netdev->mtu);
	if (fw_mtu < pkt_off) {
		NL_SET_ERR_MSG_MOD(extack, "BPF offload not supported with potential packet access beyond HW packet split boundary");
		return -EOPNOTSUPP;
	}

	max_stack = nn_readb(nn, NFP_NET_CFG_BPF_STACK_SZ) * 64;
	if (nfp_prog->stack_size > max_stack) {
		NL_SET_ERR_MSG_MOD(extack, "stack too large");
		return -EOPNOTSUPP;
	}

	max_prog_len = nn_readw(nn, NFP_NET_CFG_BPF_MAX_LEN);
	if (nfp_prog->prog_len > max_prog_len) {
		NL_SET_ERR_MSG_MOD(extack, "program too long");
		return -EOPNOTSUPP;
	}

	img = nfp_bpf_relo_for_vnic(nfp_prog, nn->app_priv);
	if (IS_ERR(img))
		return PTR_ERR(img);

	dma_addr = dma_map_single(nn->dp.dev, img,
				  nfp_prog->prog_len * sizeof(u64),
				  DMA_TO_DEVICE);
	if (dma_mapping_error(nn->dp.dev, dma_addr)) {
		kfree(img);
		return -ENOMEM;
	}

	nn_writew(nn, NFP_NET_CFG_BPF_SIZE, nfp_prog->prog_len);
	nn_writeq(nn, NFP_NET_CFG_BPF_ADDR, dma_addr);

	/* Load up the JITed code */
	err = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_BPF);
	if (err)
		NL_SET_ERR_MSG_MOD(extack,
				   "FW command error while loading BPF");

	dma_unmap_single(nn->dp.dev, dma_addr, nfp_prog->prog_len * sizeof(u64),
			 DMA_TO_DEVICE);
	kfree(img);

	return err;
}

static void
nfp_net_bpf_start(struct nfp_net *nn, struct netlink_ext_ack *extack)
{
	int err;

	/* Enable passing packets through BPF function */
	nn->dp.ctrl |= NFP_NET_CFG_CTRL_BPF;
	nn_writel(nn, NFP_NET_CFG_CTRL, nn->dp.ctrl);
	err = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_GEN);
	if (err)
		NL_SET_ERR_MSG_MOD(extack,
				   "FW command error while enabling BPF");
}

static int nfp_net_bpf_stop(struct nfp_net *nn)
{
	if (!(nn->dp.ctrl & NFP_NET_CFG_CTRL_BPF))
		return 0;

	nn->dp.ctrl &= ~NFP_NET_CFG_CTRL_BPF;
	nn_writel(nn, NFP_NET_CFG_CTRL, nn->dp.ctrl);

	return nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_GEN);
}

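/* Three transitions are handled here: first load (which also flips the BPF
 * bit in the control word via nfp_net_bpf_start()), live replace of one
 * program by another (only if FW advertises NFP_NET_BPF_CAP_RELO), and
 * removal via nfp_net_bpf_stop().
 */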
int nfp_net_bpf_offload(struct nfp_net *nn, struct bpf_prog *prog,
			bool old_prog, struct netlink_ext_ack *extack)
{
	int err;

	if (prog && !bpf_offload_dev_match(prog, nn->dp.netdev))
		return -EINVAL;

	if (prog && old_prog) {
		u8 cap;

		cap = nn_readb(nn, NFP_NET_CFG_BPF_CAP);
		if (!(cap & NFP_NET_BPF_CAP_RELO)) {
			NL_SET_ERR_MSG_MOD(extack,
					   "FW does not support live reload");
			return -EBUSY;
		}
	}

	/* Something else is loaded, different program type? */
	if (!old_prog && nn->dp.ctrl & NFP_NET_CFG_CTRL_BPF)
		return -EBUSY;

	if (old_prog && !prog)
		return nfp_net_bpf_stop(nn);

	err = nfp_net_bpf_load(nn, prog, extack);
	if (err)
		return err;

	if (!old_prog)
		nfp_net_bpf_start(nn, extack);

	return 0;
}

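/* Verifier and translation callbacks used by the core BPF offload code;
 * program destruction is still requested through ->ndo_bpf() (see
 * nfp_ndo_bpf() above) rather than a callback here.
 */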
const struct bpf_prog_offload_ops nfp_bpf_dev_ops = {
	.insn_hook	= nfp_verify_insn,
	.finalize	= nfp_bpf_finalize,
	.prepare	= nfp_bpf_verifier_prep,
	.translate	= nfp_bpf_translate,
};