// SPDX-License-Identifier: (GPL-2.0-only OR BSD-2-Clause)
/* Copyright (C) 2015-2018 Netronome Systems, Inc. */

/*
 * nfp_net_common.c
 * Netronome network device driver: Common functions between PF and VF
 * Authors: Jakub Kicinski <jakub.kicinski@netronome.com>
 *          Jason McMullan <jason.mcmullan@netronome.com>
 *          Rolf Neugebauer <rolf.neugebauer@netronome.com>
 *          Brad Petrus <brad.petrus@netronome.com>
 *          Chris Telfer <chris.telfer@netronome.com>
 */

#include <linux/bitfield.h>
#include <linux/bpf.h>
#include <linux/bpf_trace.h>
#include <linux/module.h>
#include <linux/kernel.h>
#include <linux/init.h>
#include <linux/fs.h>
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/interrupt.h>
#include <linux/ip.h>
#include <linux/ipv6.h>
#include <linux/mm.h>
#include <linux/overflow.h>
#include <linux/page_ref.h>
#include <linux/pci.h>
#include <linux/pci_regs.h>
#include <linux/msi.h>
#include <linux/ethtool.h>
#include <linux/log2.h>
#include <linux/if_vlan.h>
#include <linux/random.h>
#include <linux/vmalloc.h>
#include <linux/ktime.h>

#include <net/tls.h>
#include <net/vxlan.h>

#include "nfpcore/nfp_nsp.h"
#include "ccm.h"
#include "nfp_app.h"
#include "nfp_net_ctrl.h"
#include "nfp_net.h"
#include "nfp_net_sriov.h"
#include "nfp_port.h"
#include "crypto/crypto.h"
#include "crypto/fw.h"

/**
 * nfp_net_get_fw_version() - Read and parse the FW version
 * @fw_ver: Output fw_version structure to read to
 * @ctrl_bar: Mapped address of the control BAR
 */
void nfp_net_get_fw_version(struct nfp_net_fw_version *fw_ver,
			    void __iomem *ctrl_bar)
{
	u32 reg;

	reg = readl(ctrl_bar + NFP_NET_CFG_VERSION);
	put_unaligned_le32(reg, fw_ver);
}

static dma_addr_t nfp_net_dma_map_rx(struct nfp_net_dp *dp, void *frag)
{
	return dma_map_single_attrs(dp->dev, frag + NFP_NET_RX_BUF_HEADROOM,
				    dp->fl_bufsz - NFP_NET_RX_BUF_NON_DATA,
				    dp->rx_dma_dir, DMA_ATTR_SKIP_CPU_SYNC);
}

static void
nfp_net_dma_sync_dev_rx(const struct nfp_net_dp *dp, dma_addr_t dma_addr)
{
	dma_sync_single_for_device(dp->dev, dma_addr,
				   dp->fl_bufsz - NFP_NET_RX_BUF_NON_DATA,
				   dp->rx_dma_dir);
}

static void nfp_net_dma_unmap_rx(struct nfp_net_dp *dp, dma_addr_t dma_addr)
{
	dma_unmap_single_attrs(dp->dev, dma_addr,
			       dp->fl_bufsz - NFP_NET_RX_BUF_NON_DATA,
			       dp->rx_dma_dir, DMA_ATTR_SKIP_CPU_SYNC);
}

static void nfp_net_dma_sync_cpu_rx(struct nfp_net_dp *dp, dma_addr_t dma_addr,
				    unsigned int len)
{
	dma_sync_single_for_cpu(dp->dev, dma_addr - NFP_NET_RX_BUF_HEADROOM,
				len, dp->rx_dma_dir);
}

/* Firmware reconfig
 *
 * Firmware reconfig may take a while so we have two versions of it -
 * synchronous and asynchronous (posted). All synchronous callers are holding
 * RTNL so we don't have to worry about serializing them.
 */
static void nfp_net_reconfig_start(struct nfp_net *nn, u32 update)
{
	nn_writel(nn, NFP_NET_CFG_UPDATE, update);
	/* ensure update is written before pinging HW */
	nn_pci_flush(nn);
	nfp_qcp_wr_ptr_add(nn->qcp_cfg, 1);
	nn->reconfig_in_progress_update = update;
}

/* Pass 0 as update to run posted reconfigs. */
static void nfp_net_reconfig_start_async(struct nfp_net *nn, u32 update)
{
	update |= nn->reconfig_posted;
	nn->reconfig_posted = 0;

	nfp_net_reconfig_start(nn, update);

	nn->reconfig_timer_active = true;
	mod_timer(&nn->reconfig_timer, jiffies + NFP_NET_POLL_TIMEOUT * HZ);
}

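/* Check whether a started reconfig has completed. Returns true once the
 * firmware has cleared the update word, or when an error or (if @last_check
 * is set) a timeout is detected; both conditions are logged. Returns false
 * while the update is still pending.
 */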
static bool nfp_net_reconfig_check_done(struct nfp_net *nn, bool last_check)
{
	u32 reg;

	reg = nn_readl(nn, NFP_NET_CFG_UPDATE);
	if (reg == 0)
		return true;
	if (reg & NFP_NET_CFG_UPDATE_ERR) {
		nn_err(nn, "Reconfig error (status: 0x%08x update: 0x%08x ctrl: 0x%08x)\n",
		       reg, nn->reconfig_in_progress_update,
		       nn_readl(nn, NFP_NET_CFG_CTRL));
		return true;
	} else if (last_check) {
		nn_err(nn, "Reconfig timeout (status: 0x%08x update: 0x%08x ctrl: 0x%08x)\n",
		       reg, nn->reconfig_in_progress_update,
		       nn_readl(nn, NFP_NET_CFG_CTRL));
		return true;
	}

	return false;
}

static bool __nfp_net_reconfig_wait(struct nfp_net *nn, unsigned long deadline)
{
	bool timed_out = false;
	int i;

	/* Poll update field, waiting for NFP to ack the config.
	 * Do an opportunistic busy-wait loop first, then sleep.
	 */
	for (i = 0; i < 50; i++) {
		if (nfp_net_reconfig_check_done(nn, false))
			return false;
		udelay(4);
	}

	while (!nfp_net_reconfig_check_done(nn, timed_out)) {
		usleep_range(250, 500);
		timed_out = time_is_before_eq_jiffies(deadline);
	}

	return timed_out;
}

static int nfp_net_reconfig_wait(struct nfp_net *nn, unsigned long deadline)
{
	if (__nfp_net_reconfig_wait(nn, deadline))
		return -EIO;

	if (nn_readl(nn, NFP_NET_CFG_UPDATE) & NFP_NET_CFG_UPDATE_ERR)
		return -EIO;

	return 0;
}

static void nfp_net_reconfig_timer(struct timer_list *t)
{
	struct nfp_net *nn = from_timer(nn, t, reconfig_timer);

	spin_lock_bh(&nn->reconfig_lock);

	nn->reconfig_timer_active = false;

	/* If sync caller is present it will take over from us */
	if (nn->reconfig_sync_present)
		goto done;

	/* Read reconfig status and report errors */
	nfp_net_reconfig_check_done(nn, true);

	if (nn->reconfig_posted)
		nfp_net_reconfig_start_async(nn, 0);
done:
	spin_unlock_bh(&nn->reconfig_lock);
}

/**
 * nfp_net_reconfig_post() - Post async reconfig request
 * @nn: NFP Net device to reconfigure
 * @update: The value for the update field in the BAR config
 *
 * Record FW reconfiguration request. Reconfiguration will be kicked off
 * whenever reconfiguration machinery is idle. Multiple requests can be
 * merged together!
 */
static void nfp_net_reconfig_post(struct nfp_net *nn, u32 update)
{
	spin_lock_bh(&nn->reconfig_lock);

	/* Sync caller will kick off async reconf when it's done, just post */
	if (nn->reconfig_sync_present) {
		nn->reconfig_posted |= update;
		goto done;
	}

	/* Opportunistically check if the previous command is done */
	if (!nn->reconfig_timer_active ||
	    nfp_net_reconfig_check_done(nn, false))
		nfp_net_reconfig_start_async(nn, update);
	else
		nn->reconfig_posted |= update;
done:
	spin_unlock_bh(&nn->reconfig_lock);
}

static void nfp_net_reconfig_sync_enter(struct nfp_net *nn)
{
	bool cancelled_timer = false;
	u32 pre_posted_requests;

	spin_lock_bh(&nn->reconfig_lock);

	WARN_ON(nn->reconfig_sync_present);
	nn->reconfig_sync_present = true;

	if (nn->reconfig_timer_active) {
		nn->reconfig_timer_active = false;
		cancelled_timer = true;
	}
	pre_posted_requests = nn->reconfig_posted;
	nn->reconfig_posted = 0;

	spin_unlock_bh(&nn->reconfig_lock);

	if (cancelled_timer) {
		del_timer_sync(&nn->reconfig_timer);
		nfp_net_reconfig_wait(nn, nn->reconfig_timer.expires);
	}

	/* Run the posted reconfigs which were issued before we started */
	if (pre_posted_requests) {
		nfp_net_reconfig_start(nn, pre_posted_requests);
		nfp_net_reconfig_wait(nn, jiffies + HZ * NFP_NET_POLL_TIMEOUT);
	}
}

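/* Flush any outstanding posted reconfigs: take over as the synchronous
 * caller, let nfp_net_reconfig_sync_enter() run and wait for them, then
 * drop the sync ownership again.
 */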
static void nfp_net_reconfig_wait_posted(struct nfp_net *nn)
{
	nfp_net_reconfig_sync_enter(nn);

	spin_lock_bh(&nn->reconfig_lock);
	nn->reconfig_sync_present = false;
	spin_unlock_bh(&nn->reconfig_lock);
}

/**
 * __nfp_net_reconfig() - Reconfigure the firmware
 * @nn: NFP Net device to reconfigure
 * @update: The value for the update field in the BAR config
 *
 * Write the update word to the BAR and ping the reconfig queue. Then
 * poll until the firmware has acknowledged the update by zeroing the
 * update word.
 *
 * Return: Negative errno on error, 0 on success
 */
int __nfp_net_reconfig(struct nfp_net *nn, u32 update)
{
	int ret;

	nfp_net_reconfig_sync_enter(nn);

	nfp_net_reconfig_start(nn, update);
	ret = nfp_net_reconfig_wait(nn, jiffies + HZ * NFP_NET_POLL_TIMEOUT);

	spin_lock_bh(&nn->reconfig_lock);

	if (nn->reconfig_posted)
		nfp_net_reconfig_start_async(nn, 0);

	nn->reconfig_sync_present = false;

	spin_unlock_bh(&nn->reconfig_lock);

	return ret;
}

int nfp_net_reconfig(struct nfp_net *nn, u32 update)
{
	int ret;

	nn_ctrl_bar_lock(nn);
	ret = __nfp_net_reconfig(nn, update);
	nn_ctrl_bar_unlock(nn);

	return ret;
}

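/* Take the control BAR lock for a mailbox command, after checking that the
 * firmware-advertised mailbox is large enough to hold @data_size bytes of
 * command data.
 */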
int nfp_net_mbox_lock(struct nfp_net *nn, unsigned int data_size)
{
	if (nn->tlv_caps.mbox_len < NFP_NET_CFG_MBOX_SIMPLE_VAL + data_size) {
		nn_err(nn, "mailbox too small for %u of data (%u)\n",
		       data_size, nn->tlv_caps.mbox_len);
		return -EIO;
	}

	nn_ctrl_bar_lock(nn);
	return 0;
}

/**
 * nfp_net_mbox_reconfig() - Reconfigure the firmware via the mailbox
 * @nn: NFP Net device to reconfigure
 * @mbox_cmd: The value for the mailbox command
 *
 * Helper function for mailbox updates
 *
 * Return: Negative errno on error, 0 on success
 */
int nfp_net_mbox_reconfig(struct nfp_net *nn, u32 mbox_cmd)
{
	u32 mbox = nn->tlv_caps.mbox_off;
	int ret;

	nn_writeq(nn, mbox + NFP_NET_CFG_MBOX_SIMPLE_CMD, mbox_cmd);

	ret = __nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_MBOX);
	if (ret) {
		nn_err(nn, "Mailbox update error\n");
		return ret;
	}

	return -nn_readl(nn, mbox + NFP_NET_CFG_MBOX_SIMPLE_RET);
}

void nfp_net_mbox_reconfig_post(struct nfp_net *nn, u32 mbox_cmd)
{
	u32 mbox = nn->tlv_caps.mbox_off;

	nn_writeq(nn, mbox + NFP_NET_CFG_MBOX_SIMPLE_CMD, mbox_cmd);

	nfp_net_reconfig_post(nn, NFP_NET_CFG_UPDATE_MBOX);
}

int nfp_net_mbox_reconfig_wait_posted(struct nfp_net *nn)
{
	u32 mbox = nn->tlv_caps.mbox_off;

	nfp_net_reconfig_wait_posted(nn);

	return -nn_readl(nn, mbox + NFP_NET_CFG_MBOX_SIMPLE_RET);
}

int nfp_net_mbox_reconfig_and_unlock(struct nfp_net *nn, u32 mbox_cmd)
{
	int ret;

	ret = nfp_net_mbox_reconfig(nn, mbox_cmd);
	nn_ctrl_bar_unlock(nn);
	return ret;
}

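/* Simplified sketch of how callers elsewhere in the driver are expected to
 * use the mailbox helpers above (names refer only to functions defined in
 * this file; the command data layout depends on the specific command):
 *
 *	err = nfp_net_mbox_lock(nn, cmd_data_len);
 *	if (err)
 *		return err;
 *	// ...write command data into the mailbox area in the control BAR...
 *	return nfp_net_mbox_reconfig_and_unlock(nn, mbox_cmd);
 */
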
/* Interrupt configuration and handling
 */

/**
 * nfp_net_irq_unmask() - Unmask automasked interrupt
 * @nn:       NFP Network structure
 * @entry_nr: MSI-X table entry
 *
 * Clear the ICR for the IRQ entry.
 */
static void nfp_net_irq_unmask(struct nfp_net *nn, unsigned int entry_nr)
{
	nn_writeb(nn, NFP_NET_CFG_ICR(entry_nr), NFP_NET_CFG_ICR_UNMASKED);
	nn_pci_flush(nn);
}

/**
 * nfp_net_irqs_alloc() - allocates MSI-X irqs
 * @pdev:        PCI device structure
 * @irq_entries: Array to be initialized and used to hold the irq entries
 * @min_irqs:    Minimal acceptable number of interrupts
 * @wanted_irqs: Target number of interrupts to allocate
 *
 * Return: Number of irqs obtained or 0 on error.
 */
unsigned int
nfp_net_irqs_alloc(struct pci_dev *pdev, struct msix_entry *irq_entries,
		   unsigned int min_irqs, unsigned int wanted_irqs)
{
	unsigned int i;
	int got_irqs;

	for (i = 0; i < wanted_irqs; i++)
		irq_entries[i].entry = i;

	got_irqs = pci_enable_msix_range(pdev, irq_entries,
					 min_irqs, wanted_irqs);
	if (got_irqs < 0) {
		dev_err(&pdev->dev, "Failed to enable %d-%d MSI-X (err=%d)\n",
			min_irqs, wanted_irqs, got_irqs);
		return 0;
	}

	if (got_irqs < wanted_irqs)
		dev_warn(&pdev->dev, "Unable to allocate %d IRQs got only %d\n",
			 wanted_irqs, got_irqs);

	return got_irqs;
}

/**
 * nfp_net_irqs_assign() - Assign interrupts allocated externally to netdev
 * @nn:          NFP Network structure
 * @irq_entries: Table of allocated interrupts
 * @n:           Size of @irq_entries (number of entries to grab)
 *
 * After interrupts are allocated with nfp_net_irqs_alloc() this function
 * should be called to assign them to a specific netdev (port).
 */
void
nfp_net_irqs_assign(struct nfp_net *nn, struct msix_entry *irq_entries,
		    unsigned int n)
{
	struct nfp_net_dp *dp = &nn->dp;

	nn->max_r_vecs = n - NFP_NET_NON_Q_VECTORS;
	dp->num_r_vecs = nn->max_r_vecs;

	memcpy(nn->irq_entries, irq_entries, sizeof(*irq_entries) * n);

	if (dp->num_rx_rings > dp->num_r_vecs ||
	    dp->num_tx_rings > dp->num_r_vecs)
		dev_warn(nn->dp.dev, "More rings (%d,%d) than vectors (%d).\n",
			 dp->num_rx_rings, dp->num_tx_rings,
			 dp->num_r_vecs);

	dp->num_rx_rings = min(dp->num_r_vecs, dp->num_rx_rings);
	dp->num_tx_rings = min(dp->num_r_vecs, dp->num_tx_rings);
	dp->num_stack_tx_rings = dp->num_tx_rings;
}

/**
 * nfp_net_irqs_disable() - Disable interrupts
 * @pdev: PCI device structure
 *
 * Undoes what @nfp_net_irqs_alloc() does.
 */
void nfp_net_irqs_disable(struct pci_dev *pdev)
{
	pci_disable_msix(pdev);
}

/**
 * nfp_net_irq_rxtx() - Interrupt service routine for RX/TX rings.
 * @irq:  Interrupt
 * @data: Opaque data structure
 *
 * Return: Indicate if the interrupt has been handled.
 */
static irqreturn_t nfp_net_irq_rxtx(int irq, void *data)
{
	struct nfp_net_r_vector *r_vec = data;

	napi_schedule_irqoff(&r_vec->napi);

	/* The FW auto-masks any interrupt, either via the MASK bit in
	 * the MSI-X table or via the per entry ICR field. So there
	 * is no need to disable interrupts here.
	 */
	return IRQ_HANDLED;
}

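/* Control vNIC queues are serviced from a tasklet rather than NAPI; just
 * schedule the per-vector tasklet here.
 */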
static irqreturn_t nfp_ctrl_irq_rxtx(int irq, void *data)
{
	struct nfp_net_r_vector *r_vec = data;

	tasklet_schedule(&r_vec->tasklet);

	return IRQ_HANDLED;
}

/**
 * nfp_net_read_link_status() - Reread link status from control BAR
 * @nn: NFP Network structure
 */
static void nfp_net_read_link_status(struct nfp_net *nn)
{
	unsigned long flags;
	bool link_up;
	u32 sts;

	spin_lock_irqsave(&nn->link_status_lock, flags);

	sts = nn_readl(nn, NFP_NET_CFG_STS);
	link_up = !!(sts & NFP_NET_CFG_STS_LINK);

	if (nn->link_up == link_up)
		goto out;

	nn->link_up = link_up;
	if (nn->port)
		set_bit(NFP_PORT_CHANGED, &nn->port->flags);

	if (nn->link_up) {
		netif_carrier_on(nn->dp.netdev);
		netdev_info(nn->dp.netdev, "NIC Link is Up\n");
	} else {
		netif_carrier_off(nn->dp.netdev);
		netdev_info(nn->dp.netdev, "NIC Link is Down\n");
	}
out:
	spin_unlock_irqrestore(&nn->link_status_lock, flags);
}

/**
 * nfp_net_irq_lsc() - Interrupt service routine for link state changes
 * @irq:  Interrupt
 * @data: Opaque data structure
 *
 * Return: Indicate if the interrupt has been handled.
 */
static irqreturn_t nfp_net_irq_lsc(int irq, void *data)
{
	struct nfp_net *nn = data;
	struct msix_entry *entry;

	entry = &nn->irq_entries[NFP_NET_IRQ_LSC_IDX];

	nfp_net_read_link_status(nn);

	nfp_net_irq_unmask(nn, entry->entry);

	return IRQ_HANDLED;
}

/**
 * nfp_net_irq_exn() - Interrupt service routine for exceptions
 * @irq:  Interrupt
 * @data: Opaque data structure
 *
 * Return: Indicate if the interrupt has been handled.
 */
static irqreturn_t nfp_net_irq_exn(int irq, void *data)
{
	struct nfp_net *nn = data;

	nn_err(nn, "%s: UNIMPLEMENTED.\n", __func__);
	/* XXX TO BE IMPLEMENTED */
	return IRQ_HANDLED;
}

/**
 * nfp_net_tx_ring_init() - Fill in the boilerplate for a TX ring
 * @tx_ring: TX ring structure
 * @r_vec:   IRQ vector servicing this ring
 * @idx:     Ring index
 * @is_xdp:  Is this an XDP TX ring?
 */
static void
nfp_net_tx_ring_init(struct nfp_net_tx_ring *tx_ring,
		     struct nfp_net_r_vector *r_vec, unsigned int idx,
		     bool is_xdp)
{
	struct nfp_net *nn = r_vec->nfp_net;

	tx_ring->idx = idx;
	tx_ring->r_vec = r_vec;
	tx_ring->is_xdp = is_xdp;
	u64_stats_init(&tx_ring->r_vec->tx_sync);

	tx_ring->qcidx = tx_ring->idx * nn->stride_tx;
	tx_ring->qcp_q = nn->tx_bar + NFP_QCP_QUEUE_OFF(tx_ring->qcidx);
}

/**
 * nfp_net_rx_ring_init() - Fill in the boilerplate for a RX ring
 * @rx_ring: RX ring structure
 * @r_vec:   IRQ vector servicing this ring
 * @idx:     Ring index
 */
static void
nfp_net_rx_ring_init(struct nfp_net_rx_ring *rx_ring,
		     struct nfp_net_r_vector *r_vec, unsigned int idx)
{
	struct nfp_net *nn = r_vec->nfp_net;

	rx_ring->idx = idx;
	rx_ring->r_vec = r_vec;
	u64_stats_init(&rx_ring->r_vec->rx_sync);

	rx_ring->fl_qcidx = rx_ring->idx * nn->stride_rx;
	rx_ring->qcp_fl = nn->rx_bar + NFP_QCP_QUEUE_OFF(rx_ring->fl_qcidx);
}

/**
 * nfp_net_aux_irq_request() - Request an auxiliary interrupt (LSC or EXN)
 * @nn:          NFP Network structure
 * @ctrl_offset: Control BAR offset where IRQ configuration should be written
 * @format:      printf-style format to construct the interrupt name
 * @name:        Pointer to allocated space for interrupt name
 * @name_sz:     Size of space for interrupt name
 * @vector_idx:  Index of MSI-X vector used for this interrupt
 * @handler:     IRQ handler to register for this interrupt
 */
static int
nfp_net_aux_irq_request(struct nfp_net *nn, u32 ctrl_offset,
			const char *format, char *name, size_t name_sz,
			unsigned int vector_idx, irq_handler_t handler)
{
	struct msix_entry *entry;
	int err;

	entry = &nn->irq_entries[vector_idx];

	snprintf(name, name_sz, format, nfp_net_name(nn));
	err = request_irq(entry->vector, handler, 0, name, nn);
	if (err) {
		nn_err(nn, "Failed to request IRQ %d (err=%d).\n",
		       entry->vector, err);
		return err;
	}
	nn_writeb(nn, ctrl_offset, entry->entry);
	nfp_net_irq_unmask(nn, entry->entry);

	return 0;
}

/**
 * nfp_net_aux_irq_free() - Free an auxiliary interrupt (LSC or EXN)
 * @nn:          NFP Network structure
 * @ctrl_offset: Control BAR offset where IRQ configuration should be written
 * @vector_idx:  Index of MSI-X vector used for this interrupt
 */
static void nfp_net_aux_irq_free(struct nfp_net *nn, u32 ctrl_offset,
				 unsigned int vector_idx)
{
	nn_writeb(nn, ctrl_offset, 0xff);
	nn_pci_flush(nn);
	free_irq(nn->irq_entries[vector_idx].vector, nn);
}

/* Transmit
 *
 * One queue controller peripheral queue is used for transmit. The
 * driver en-queues packets for transmit by advancing the write
 * pointer. The device indicates that packets have been transmitted by
 * advancing the read pointer. The driver maintains a local copy of
 * the read and write pointer in @struct nfp_net_tx_ring. The driver
 * keeps @wr_p in sync with the queue controller write pointer and can
 * determine how many packets have been transmitted by comparing its
 * copy of the read pointer @rd_p with the read pointer maintained by
 * the queue controller peripheral.
 */

/**
 * nfp_net_tx_full() - Check if the TX ring is full
 * @tx_ring: TX ring to check
 * @dcnt:    Number of descriptors that need to be enqueued (must be >= 1)
 *
 * This function checks, based on the *host copy* of the read/write
 * pointers, whether a given TX ring is full. The real TX queue may have
 * some newly made available slots.
 *
 * Return: True if the ring is full.
 */
static int nfp_net_tx_full(struct nfp_net_tx_ring *tx_ring, int dcnt)
{
	return (tx_ring->wr_p - tx_ring->rd_p) >= (tx_ring->cnt - dcnt);
}

/* Wrappers for deciding when to stop and restart TX queues */
static int nfp_net_tx_ring_should_wake(struct nfp_net_tx_ring *tx_ring)
{
	return !nfp_net_tx_full(tx_ring, MAX_SKB_FRAGS * 4);
}

static int nfp_net_tx_ring_should_stop(struct nfp_net_tx_ring *tx_ring)
{
	return nfp_net_tx_full(tx_ring, MAX_SKB_FRAGS + 1);
}

/**
 * nfp_net_tx_ring_stop() - stop tx ring
 * @nd_q:    netdev queue
 * @tx_ring: driver tx queue structure
 *
 * Safely stop TX ring. Remember that while we are running .start_xmit()
 * someone else may be cleaning the TX ring completions so we need to be
 * extra careful here.
 */
static void nfp_net_tx_ring_stop(struct netdev_queue *nd_q,
				 struct nfp_net_tx_ring *tx_ring)
{
	netif_tx_stop_queue(nd_q);

	/* We can race with the TX completion out of NAPI so recheck */
	smp_mb();
	if (unlikely(nfp_net_tx_ring_should_wake(tx_ring)))
		netif_tx_start_queue(nd_q);
}

/**
 * nfp_net_tx_tso() - Set up Tx descriptor for LSO
 * @r_vec:    per-ring structure
 * @txbuf:    Pointer to driver soft TX descriptor
 * @txd:      Pointer to HW TX descriptor
 * @skb:      Pointer to SKB
 * @md_bytes: Prepend length
 *
 * Set up Tx descriptor for LSO, do nothing for non-LSO skbs.
 * Return error on packet header greater than maximum supported LSO header size.
 */
static void nfp_net_tx_tso(struct nfp_net_r_vector *r_vec,
			   struct nfp_net_tx_buf *txbuf,
			   struct nfp_net_tx_desc *txd, struct sk_buff *skb,
			   u32 md_bytes)
{
	u32 l3_offset, l4_offset, hdrlen;
	u16 mss;

	if (!skb_is_gso(skb))
		return;

	if (!skb->encapsulation) {
		l3_offset = skb_network_offset(skb);
		l4_offset = skb_transport_offset(skb);
		hdrlen = skb_transport_offset(skb) + tcp_hdrlen(skb);
	} else {
		l3_offset = skb_inner_network_offset(skb);
		l4_offset = skb_inner_transport_offset(skb);
		hdrlen = skb_inner_transport_header(skb) - skb->data +
			inner_tcp_hdrlen(skb);
	}

	txbuf->pkt_cnt = skb_shinfo(skb)->gso_segs;
	txbuf->real_len += hdrlen * (txbuf->pkt_cnt - 1);

	mss = skb_shinfo(skb)->gso_size & PCIE_DESC_TX_MSS_MASK;
	txd->l3_offset = l3_offset - md_bytes;
	txd->l4_offset = l4_offset - md_bytes;
	txd->lso_hdrlen = hdrlen - md_bytes;
	txd->mss = cpu_to_le16(mss);
	txd->flags |= PCIE_DESC_TX_LSO;

	u64_stats_update_begin(&r_vec->tx_sync);
	r_vec->tx_lso++;
	u64_stats_update_end(&r_vec->tx_sync);
}

/**
 * nfp_net_tx_csum() - Set TX CSUM offload flags in TX descriptor
 * @dp:    NFP Net data path struct
 * @r_vec: per-ring structure
 * @txbuf: Pointer to driver soft TX descriptor
 * @txd:   Pointer to TX descriptor
 * @skb:   Pointer to SKB
 *
 * This function sets the TX checksum flags in the TX descriptor based
 * on the configuration and the protocol of the packet to be transmitted.
 */
static void nfp_net_tx_csum(struct nfp_net_dp *dp,
			    struct nfp_net_r_vector *r_vec,
			    struct nfp_net_tx_buf *txbuf,
			    struct nfp_net_tx_desc *txd, struct sk_buff *skb)
{
	struct ipv6hdr *ipv6h;
	struct iphdr *iph;
	u8 l4_hdr;

	if (!(dp->ctrl & NFP_NET_CFG_CTRL_TXCSUM))
		return;

	if (skb->ip_summed != CHECKSUM_PARTIAL)
		return;

	txd->flags |= PCIE_DESC_TX_CSUM;
	if (skb->encapsulation)
		txd->flags |= PCIE_DESC_TX_ENCAP;

	iph = skb->encapsulation ? inner_ip_hdr(skb) : ip_hdr(skb);
	ipv6h = skb->encapsulation ? inner_ipv6_hdr(skb) : ipv6_hdr(skb);

	if (iph->version == 4) {
		txd->flags |= PCIE_DESC_TX_IP4_CSUM;
		l4_hdr = iph->protocol;
	} else if (ipv6h->version == 6) {
		l4_hdr = ipv6h->nexthdr;
	} else {
		nn_dp_warn(dp, "partial checksum but ipv=%x!\n", iph->version);
		return;
	}

	switch (l4_hdr) {
	case IPPROTO_TCP:
		txd->flags |= PCIE_DESC_TX_TCP_CSUM;
		break;
	case IPPROTO_UDP:
		txd->flags |= PCIE_DESC_TX_UDP_CSUM;
		break;
	default:
		nn_dp_warn(dp, "partial checksum but l4 proto=%x!\n", l4_hdr);
		return;
	}

	u64_stats_update_begin(&r_vec->tx_sync);
	if (skb->encapsulation)
		r_vec->hw_csum_tx_inner += txbuf->pkt_cnt;
	else
		r_vec->hw_csum_tx += txbuf->pkt_cnt;
	u64_stats_update_end(&r_vec->tx_sync);
}

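/* kTLS TX offload: if the skb belongs to a device-offloaded TLS socket, look
 * up the firmware connection handle and return it via @tls_handle so it can
 * be placed in the TX metadata prepend. Out-of-order segments (or a pending
 * resync) fall back to software encryption via tls_encrypt_skb(); in that
 * case the returned skb may differ from the one passed in and @nr_frags is
 * reset. Returns NULL if the fallback fails and the caller should drop the
 * packet.
 */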
static struct sk_buff *
nfp_net_tls_tx(struct nfp_net_dp *dp, struct nfp_net_r_vector *r_vec,
	       struct sk_buff *skb, u64 *tls_handle, int *nr_frags)
{
#ifdef CONFIG_TLS_DEVICE
	struct nfp_net_tls_offload_ctx *ntls;
	struct sk_buff *nskb;
	bool resync_pending;
	u32 datalen, seq;

	if (likely(!dp->ktls_tx))
		return skb;
	if (!skb->sk || !tls_is_sk_tx_device_offloaded(skb->sk))
		return skb;

	datalen = skb->len - (skb_transport_offset(skb) + tcp_hdrlen(skb));
	seq = ntohl(tcp_hdr(skb)->seq);
	ntls = tls_driver_ctx(skb->sk, TLS_OFFLOAD_CTX_DIR_TX);
	resync_pending = tls_offload_tx_resync_pending(skb->sk);
	if (unlikely(resync_pending || ntls->next_seq != seq)) {
		/* Pure ACK out of order already */
		if (!datalen)
			return skb;

		u64_stats_update_begin(&r_vec->tx_sync);
		r_vec->tls_tx_fallback++;
		u64_stats_update_end(&r_vec->tx_sync);

		nskb = tls_encrypt_skb(skb);
		if (!nskb) {
			u64_stats_update_begin(&r_vec->tx_sync);
			r_vec->tls_tx_no_fallback++;
			u64_stats_update_end(&r_vec->tx_sync);
			return NULL;
		}
		/* encryption wasn't necessary */
		if (nskb == skb)
			return skb;
		/* we don't re-check ring space */
		if (unlikely(skb_is_nonlinear(nskb))) {
			nn_dp_warn(dp, "tls_encrypt_skb() produced fragmented frame\n");
			u64_stats_update_begin(&r_vec->tx_sync);
			r_vec->tx_errors++;
			u64_stats_update_end(&r_vec->tx_sync);
			dev_kfree_skb_any(nskb);
			return NULL;
		}

		/* jump forward, a TX may have gotten lost, need to sync TX */
		if (!resync_pending && seq - ntls->next_seq < U32_MAX / 4)
			tls_offload_tx_resync_request(nskb->sk, seq,
						      ntls->next_seq);

		*nr_frags = 0;
		return nskb;
	}

	if (datalen) {
		u64_stats_update_begin(&r_vec->tx_sync);
		if (!skb_is_gso(skb))
			r_vec->hw_tls_tx++;
		else
			r_vec->hw_tls_tx += skb_shinfo(skb)->gso_segs;
		u64_stats_update_end(&r_vec->tx_sync);
	}

	memcpy(tls_handle, ntls->fw_handle, sizeof(ntls->fw_handle));
	ntls->next_seq += datalen;
#endif
	return skb;
}

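/* Undo the TLS sequence-number accounting done in nfp_net_tls_tx() when the
 * descriptor could not be queued (e.g. DMA mapping failure), so the next
 * attempt at the same segment is not treated as out of order.
 */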
static void nfp_net_tls_tx_undo(struct sk_buff *skb, u64 tls_handle)
{
#ifdef CONFIG_TLS_DEVICE
	struct nfp_net_tls_offload_ctx *ntls;
	u32 datalen, seq;

	if (!tls_handle)
		return;
	if (WARN_ON_ONCE(!skb->sk || !tls_is_sk_tx_device_offloaded(skb->sk)))
		return;

	datalen = skb->len - (skb_transport_offset(skb) + tcp_hdrlen(skb));
	seq = ntohl(tcp_hdr(skb)->seq);

	ntls = tls_driver_ctx(skb->sk, TLS_OFFLOAD_CTX_DIR_TX);
	if (ntls->next_seq == seq + datalen)
		ntls->next_seq = seq;
	else
		WARN_ON_ONCE(1);
#endif
}

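/* Flush queued TX descriptors to the device: order the descriptor writes,
 * then bump the queue controller write pointer by the accumulated count.
 */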
static void nfp_net_tx_xmit_more_flush(struct nfp_net_tx_ring *tx_ring)
{
	wmb();
	nfp_qcp_wr_ptr_add(tx_ring->qcp_q, tx_ring->wr_ptr_add);
	tx_ring->wr_ptr_add = 0;
}

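/* Build the TX metadata prepend in front of the packet data. The prepend
 * starts with a 32-bit word of 4-bit field type IDs (the field placed right
 * after the word sits in the lowest bits), followed by the field data:
 * an optional 8-byte TLS connection handle and an optional 4-byte mux port
 * ID. Returns the number of prepend bytes used, 0 if none, or -ENOMEM.
 */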
static int nfp_net_prep_tx_meta(struct sk_buff *skb, u64 tls_handle)
{
	struct metadata_dst *md_dst = skb_metadata_dst(skb);
	unsigned char *data;
	u32 meta_id = 0;
	int md_bytes;

	if (likely(!md_dst && !tls_handle))
		return 0;
	if (unlikely(md_dst && md_dst->type != METADATA_HW_PORT_MUX)) {
		if (!tls_handle)
			return 0;
		md_dst = NULL;
	}

	md_bytes = 4 + !!md_dst * 4 + !!tls_handle * 8;

	if (unlikely(skb_cow_head(skb, md_bytes)))
		return -ENOMEM;

	meta_id = 0;
	data = skb_push(skb, md_bytes) + md_bytes;
	if (md_dst) {
		data -= 4;
		put_unaligned_be32(md_dst->u.port_info.port_id, data);
		meta_id = NFP_NET_META_PORTID;
	}
	if (tls_handle) {
		/* conn handle is opaque, we just use u64 to be able to quickly
		 * compare it to zero
		 */
		data -= 8;
		memcpy(data, &tls_handle, sizeof(tls_handle));
		meta_id <<= NFP_NET_META_FIELD_SIZE;
		meta_id |= NFP_NET_META_CONN_HANDLE;
	}

	data -= 4;
	put_unaligned_be32(meta_id, data);

	return md_bytes;
}

/**
 * nfp_net_tx() - Main transmit entry point
 * @skb:    SKB to transmit
 * @netdev: netdev structure
 *
 * Return: NETDEV_TX_OK on success.
 */
static netdev_tx_t nfp_net_tx(struct sk_buff *skb, struct net_device *netdev)
{
	struct nfp_net *nn = netdev_priv(netdev);
	const skb_frag_t *frag;
	int f, nr_frags, wr_idx, md_bytes;
	struct nfp_net_tx_ring *tx_ring;
	struct nfp_net_r_vector *r_vec;
	struct nfp_net_tx_buf *txbuf;
	struct nfp_net_tx_desc *txd;
	struct netdev_queue *nd_q;
	struct nfp_net_dp *dp;
	dma_addr_t dma_addr;
	unsigned int fsize;
	u64 tls_handle = 0;
	u16 qidx;

	dp = &nn->dp;
	qidx = skb_get_queue_mapping(skb);
	tx_ring = &dp->tx_rings[qidx];
	r_vec = tx_ring->r_vec;

	nr_frags = skb_shinfo(skb)->nr_frags;

	if (unlikely(nfp_net_tx_full(tx_ring, nr_frags + 1))) {
		nn_dp_warn(dp, "TX ring %d busy. wrp=%u rdp=%u\n",
			   qidx, tx_ring->wr_p, tx_ring->rd_p);
		nd_q = netdev_get_tx_queue(dp->netdev, qidx);
		netif_tx_stop_queue(nd_q);
		nfp_net_tx_xmit_more_flush(tx_ring);
		u64_stats_update_begin(&r_vec->tx_sync);
		r_vec->tx_busy++;
		u64_stats_update_end(&r_vec->tx_sync);
		return NETDEV_TX_BUSY;
	}

	skb = nfp_net_tls_tx(dp, r_vec, skb, &tls_handle, &nr_frags);
	if (unlikely(!skb)) {
		nfp_net_tx_xmit_more_flush(tx_ring);
		return NETDEV_TX_OK;
	}

	md_bytes = nfp_net_prep_tx_meta(skb, tls_handle);
	if (unlikely(md_bytes < 0))
		goto err_flush;

	/* Start with the head skbuf */
	dma_addr = dma_map_single(dp->dev, skb->data, skb_headlen(skb),
				  DMA_TO_DEVICE);
	if (dma_mapping_error(dp->dev, dma_addr))
		goto err_dma_err;

	wr_idx = D_IDX(tx_ring, tx_ring->wr_p);

	/* Stash the soft descriptor of the head then initialize it */
	txbuf = &tx_ring->txbufs[wr_idx];
	txbuf->skb = skb;
	txbuf->dma_addr = dma_addr;
	txbuf->fidx = -1;
	txbuf->pkt_cnt = 1;
	txbuf->real_len = skb->len;

	/* Build TX descriptor */
	txd = &tx_ring->txds[wr_idx];
	txd->offset_eop = (nr_frags ? 0 : PCIE_DESC_TX_EOP) | md_bytes;
	txd->dma_len = cpu_to_le16(skb_headlen(skb));
	nfp_desc_set_dma_addr(txd, dma_addr);
	txd->data_len = cpu_to_le16(skb->len);

	txd->flags = 0;
	txd->mss = 0;
	txd->lso_hdrlen = 0;

	/* Do not reorder - tso may adjust pkt cnt, vlan may override fields */
	nfp_net_tx_tso(r_vec, txbuf, txd, skb, md_bytes);
	nfp_net_tx_csum(dp, r_vec, txbuf, txd, skb);
	if (skb_vlan_tag_present(skb) && dp->ctrl & NFP_NET_CFG_CTRL_TXVLAN) {
		txd->flags |= PCIE_DESC_TX_VLAN;
		txd->vlan = cpu_to_le16(skb_vlan_tag_get(skb));
	}

	/* Gather DMA */
	if (nr_frags > 0) {
		__le64 second_half;

		/* all descs must match except for in addr, length and eop */
		second_half = txd->vals8[1];

		for (f = 0; f < nr_frags; f++) {
			frag = &skb_shinfo(skb)->frags[f];
			fsize = skb_frag_size(frag);

			dma_addr = skb_frag_dma_map(dp->dev, frag, 0,
						    fsize, DMA_TO_DEVICE);
			if (dma_mapping_error(dp->dev, dma_addr))
				goto err_unmap;

			wr_idx = D_IDX(tx_ring, wr_idx + 1);
			tx_ring->txbufs[wr_idx].skb = skb;
			tx_ring->txbufs[wr_idx].dma_addr = dma_addr;
			tx_ring->txbufs[wr_idx].fidx = f;

			txd = &tx_ring->txds[wr_idx];
			txd->dma_len = cpu_to_le16(fsize);
			nfp_desc_set_dma_addr(txd, dma_addr);
			txd->offset_eop = md_bytes |
				((f == nr_frags - 1) ? PCIE_DESC_TX_EOP : 0);
			txd->vals8[1] = second_half;
		}

		u64_stats_update_begin(&r_vec->tx_sync);
		r_vec->tx_gather++;
		u64_stats_update_end(&r_vec->tx_sync);
	}

	skb_tx_timestamp(skb);

	nd_q = netdev_get_tx_queue(dp->netdev, tx_ring->idx);

	tx_ring->wr_p += nr_frags + 1;
	if (nfp_net_tx_ring_should_stop(tx_ring))
		nfp_net_tx_ring_stop(nd_q, tx_ring);

	tx_ring->wr_ptr_add += nr_frags + 1;
	if (__netdev_tx_sent_queue(nd_q, txbuf->real_len, netdev_xmit_more()))
		nfp_net_tx_xmit_more_flush(tx_ring);

	return NETDEV_TX_OK;

err_unmap:
	while (--f >= 0) {
		frag = &skb_shinfo(skb)->frags[f];
		dma_unmap_page(dp->dev, tx_ring->txbufs[wr_idx].dma_addr,
			       skb_frag_size(frag), DMA_TO_DEVICE);
		tx_ring->txbufs[wr_idx].skb = NULL;
		tx_ring->txbufs[wr_idx].dma_addr = 0;
		tx_ring->txbufs[wr_idx].fidx = -2;
		wr_idx = wr_idx - 1;
		if (wr_idx < 0)
			wr_idx += tx_ring->cnt;
	}
	dma_unmap_single(dp->dev, tx_ring->txbufs[wr_idx].dma_addr,
			 skb_headlen(skb), DMA_TO_DEVICE);
	tx_ring->txbufs[wr_idx].skb = NULL;
	tx_ring->txbufs[wr_idx].dma_addr = 0;
	tx_ring->txbufs[wr_idx].fidx = -2;
err_dma_err:
	nn_dp_warn(dp, "Failed to map DMA TX buffer\n");
err_flush:
	nfp_net_tx_xmit_more_flush(tx_ring);
	u64_stats_update_begin(&r_vec->tx_sync);
	r_vec->tx_errors++;
	u64_stats_update_end(&r_vec->tx_sync);
	nfp_net_tls_tx_undo(skb, tls_handle);
	dev_kfree_skb_any(skb);
	return NETDEV_TX_OK;
}

/**
 * nfp_net_tx_complete() - Handle completed TX packets
 * @tx_ring: TX ring structure
 * @budget:  NAPI budget (only used as bool to determine if in NAPI context)
 */
static void nfp_net_tx_complete(struct nfp_net_tx_ring *tx_ring, int budget)
{
	struct nfp_net_r_vector *r_vec = tx_ring->r_vec;
	struct nfp_net_dp *dp = &r_vec->nfp_net->dp;
	struct netdev_queue *nd_q;
	u32 done_pkts = 0, done_bytes = 0;
	u32 qcp_rd_p;
	int todo;

	if (tx_ring->wr_p == tx_ring->rd_p)
		return;

	/* Work out how many descriptors have been transmitted */
	qcp_rd_p = nfp_qcp_rd_ptr_read(tx_ring->qcp_q);

	if (qcp_rd_p == tx_ring->qcp_rd_p)
		return;

	todo = D_IDX(tx_ring, qcp_rd_p - tx_ring->qcp_rd_p);

	while (todo--) {
		const skb_frag_t *frag;
		struct nfp_net_tx_buf *tx_buf;
		struct sk_buff *skb;
		int fidx, nr_frags;
		int idx;

		idx = D_IDX(tx_ring, tx_ring->rd_p++);
		tx_buf = &tx_ring->txbufs[idx];

		skb = tx_buf->skb;
		if (!skb)
			continue;

		nr_frags = skb_shinfo(skb)->nr_frags;
		fidx = tx_buf->fidx;

		if (fidx == -1) {
			/* unmap head */
			dma_unmap_single(dp->dev, tx_buf->dma_addr,
					 skb_headlen(skb), DMA_TO_DEVICE);

			done_pkts += tx_buf->pkt_cnt;
			done_bytes += tx_buf->real_len;
		} else {
			/* unmap fragment */
			frag = &skb_shinfo(skb)->frags[fidx];
			dma_unmap_page(dp->dev, tx_buf->dma_addr,
				       skb_frag_size(frag), DMA_TO_DEVICE);
		}

		/* check for last gather fragment */
		if (fidx == nr_frags - 1)
			napi_consume_skb(skb, budget);

		tx_buf->dma_addr = 0;
		tx_buf->skb = NULL;
		tx_buf->fidx = -2;
	}

	tx_ring->qcp_rd_p = qcp_rd_p;

	u64_stats_update_begin(&r_vec->tx_sync);
	r_vec->tx_bytes += done_bytes;
	r_vec->tx_pkts += done_pkts;
	u64_stats_update_end(&r_vec->tx_sync);

	if (!dp->netdev)
		return;

	nd_q = netdev_get_tx_queue(dp->netdev, tx_ring->idx);
	netdev_tx_completed_queue(nd_q, done_pkts, done_bytes);
	if (nfp_net_tx_ring_should_wake(tx_ring)) {
		/* Make sure TX thread will see updated tx_ring->rd_p */
		smp_mb();

		if (unlikely(netif_tx_queue_stopped(nd_q)))
			netif_tx_wake_queue(nd_q);
	}

	WARN_ONCE(tx_ring->wr_p - tx_ring->rd_p > tx_ring->cnt,
		  "TX ring corruption rd_p=%u wr_p=%u cnt=%u\n",
		  tx_ring->rd_p, tx_ring->wr_p, tx_ring->cnt);
}

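/* Reclaim completed descriptors on an XDP TX ring. The page fragments stay
 * attached to their TX slots (they are recycled back to the RX freelist when
 * a slot is reused), so only stats and ring pointers are updated here. At
 * most NFP_NET_XDP_MAX_COMPLETE descriptors are processed per call; returns
 * true once everything outstanding has been completed.
 */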
static bool nfp_net_xdp_complete(struct nfp_net_tx_ring *tx_ring)
{
	struct nfp_net_r_vector *r_vec = tx_ring->r_vec;
	u32 done_pkts = 0, done_bytes = 0;
	bool done_all;
	int idx, todo;
	u32 qcp_rd_p;

	/* Work out how many descriptors have been transmitted */
	qcp_rd_p = nfp_qcp_rd_ptr_read(tx_ring->qcp_q);

	if (qcp_rd_p == tx_ring->qcp_rd_p)
		return true;

	todo = D_IDX(tx_ring, qcp_rd_p - tx_ring->qcp_rd_p);

	done_all = todo <= NFP_NET_XDP_MAX_COMPLETE;
	todo = min(todo, NFP_NET_XDP_MAX_COMPLETE);

	tx_ring->qcp_rd_p = D_IDX(tx_ring, tx_ring->qcp_rd_p + todo);

	done_pkts = todo;
	while (todo--) {
		idx = D_IDX(tx_ring, tx_ring->rd_p);
		tx_ring->rd_p++;

		done_bytes += tx_ring->txbufs[idx].real_len;
	}

	u64_stats_update_begin(&r_vec->tx_sync);
	r_vec->tx_bytes += done_bytes;
	r_vec->tx_pkts += done_pkts;
	u64_stats_update_end(&r_vec->tx_sync);

	WARN_ONCE(tx_ring->wr_p - tx_ring->rd_p > tx_ring->cnt,
		  "XDP TX ring corruption rd_p=%u wr_p=%u cnt=%u\n",
		  tx_ring->rd_p, tx_ring->wr_p, tx_ring->cnt);

	return done_all;
}

/**
 * nfp_net_tx_ring_reset() - Free any untransmitted buffers and reset pointers
 * @dp:      NFP Net data path struct
 * @tx_ring: TX ring structure
 *
 * Assumes that the device is stopped, must be idempotent.
 */
static void
nfp_net_tx_ring_reset(struct nfp_net_dp *dp, struct nfp_net_tx_ring *tx_ring)
{
	const skb_frag_t *frag;
	struct netdev_queue *nd_q;

	while (!tx_ring->is_xdp && tx_ring->rd_p != tx_ring->wr_p) {
		struct nfp_net_tx_buf *tx_buf;
		struct sk_buff *skb;
		int idx, nr_frags;

		idx = D_IDX(tx_ring, tx_ring->rd_p);
		tx_buf = &tx_ring->txbufs[idx];

		skb = tx_ring->txbufs[idx].skb;
		nr_frags = skb_shinfo(skb)->nr_frags;

		if (tx_buf->fidx == -1) {
			/* unmap head */
			dma_unmap_single(dp->dev, tx_buf->dma_addr,
					 skb_headlen(skb), DMA_TO_DEVICE);
		} else {
			/* unmap fragment */
			frag = &skb_shinfo(skb)->frags[tx_buf->fidx];
			dma_unmap_page(dp->dev, tx_buf->dma_addr,
				       skb_frag_size(frag), DMA_TO_DEVICE);
		}

		/* check for last gather fragment */
		if (tx_buf->fidx == nr_frags - 1)
			dev_kfree_skb_any(skb);

		tx_buf->dma_addr = 0;
		tx_buf->skb = NULL;
		tx_buf->fidx = -2;

		tx_ring->qcp_rd_p++;
		tx_ring->rd_p++;
	}

	memset(tx_ring->txds, 0, tx_ring->size);
	tx_ring->wr_p = 0;
	tx_ring->rd_p = 0;
	tx_ring->qcp_rd_p = 0;
	tx_ring->wr_ptr_add = 0;

	if (tx_ring->is_xdp || !dp->netdev)
		return;

	nd_q = netdev_get_tx_queue(dp->netdev, tx_ring->idx);
	netdev_tx_reset_queue(nd_q);
}

static void nfp_net_tx_timeout(struct net_device *netdev, unsigned int txqueue)
{
	struct nfp_net *nn = netdev_priv(netdev);

	nn_warn(nn, "TX watchdog timeout on ring: %u\n", txqueue);
}

/* Receive processing
 */
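
/* Work out the size of a freelist buffer: headroom plus extra DMA offset,
 * the RX prepend (worst case when the offset is dynamic), room for the frame
 * itself (Ethernet header, two VLAN tags and the MTU), rounded up and
 * followed by the shared skb_shinfo area so the frag can later be turned
 * into an skb.
 */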
static unsigned int
nfp_net_calc_fl_bufsz(struct nfp_net_dp *dp)
{
	unsigned int fl_bufsz;

	fl_bufsz = NFP_NET_RX_BUF_HEADROOM;
	fl_bufsz += dp->rx_dma_off;
	if (dp->rx_offset == NFP_NET_CFG_RX_OFFSET_DYNAMIC)
		fl_bufsz += NFP_NET_MAX_PREPEND;
	else
		fl_bufsz += dp->rx_offset;
	fl_bufsz += ETH_HLEN + VLAN_HLEN * 2 + dp->mtu;

	fl_bufsz = SKB_DATA_ALIGN(fl_bufsz);
	fl_bufsz += SKB_DATA_ALIGN(sizeof(struct skb_shared_info));

	return fl_bufsz;
}

static void
nfp_net_free_frag(void *frag, bool xdp)
{
	if (!xdp)
		skb_free_frag(frag);
	else
		__free_page(virt_to_page(frag));
}

/**
 * nfp_net_rx_alloc_one() - Allocate and map page frag for RX
 * @dp:       NFP Net data path struct
 * @dma_addr: Pointer to storage for DMA address (output param)
 *
 * This function will allocate a new page frag and map it for DMA.
 *
 * Return: allocated page frag or NULL on failure.
 */
static void *nfp_net_rx_alloc_one(struct nfp_net_dp *dp, dma_addr_t *dma_addr)
{
	void *frag;

	if (!dp->xdp_prog) {
		frag = netdev_alloc_frag(dp->fl_bufsz);
	} else {
		struct page *page;

		page = alloc_page(GFP_KERNEL);
		frag = page ? page_address(page) : NULL;
	}
	if (!frag) {
		nn_dp_warn(dp, "Failed to alloc receive page frag\n");
		return NULL;
	}

	*dma_addr = nfp_net_dma_map_rx(dp, frag);
	if (dma_mapping_error(dp->dev, *dma_addr)) {
		nfp_net_free_frag(frag, dp->xdp_prog);
		nn_dp_warn(dp, "Failed to map DMA RX buffer\n");
		return NULL;
	}

	return frag;
}

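/* Same as nfp_net_rx_alloc_one() but for use from NAPI context: uses the
 * per-CPU NAPI frag cache (or an atomic page allocation when XDP is active)
 * instead of sleeping allocations.
 */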
static void *nfp_net_napi_alloc_one(struct nfp_net_dp *dp, dma_addr_t *dma_addr)
{
	void *frag;

	if (!dp->xdp_prog) {
		frag = napi_alloc_frag(dp->fl_bufsz);
		if (unlikely(!frag))
			return NULL;
	} else {
		struct page *page;

		page = dev_alloc_page();
		if (unlikely(!page))
			return NULL;
		frag = page_address(page);
	}

	*dma_addr = nfp_net_dma_map_rx(dp, frag);
	if (dma_mapping_error(dp->dev, *dma_addr)) {
		nfp_net_free_frag(frag, dp->xdp_prog);
		nn_dp_warn(dp, "Failed to map DMA RX buffer\n");
		return NULL;
	}

	return frag;
}

/**
 * nfp_net_rx_give_one() - Put mapped skb on the software and hardware rings
 * @dp:       NFP Net data path struct
 * @rx_ring:  RX ring structure
 * @frag:     page fragment buffer
 * @dma_addr: DMA address of skb mapping
 */
static void nfp_net_rx_give_one(const struct nfp_net_dp *dp,
				struct nfp_net_rx_ring *rx_ring,
				void *frag, dma_addr_t dma_addr)
{
	unsigned int wr_idx;

	wr_idx = D_IDX(rx_ring, rx_ring->wr_p);

	nfp_net_dma_sync_dev_rx(dp, dma_addr);

	/* Stash SKB and DMA address away */
	rx_ring->rxbufs[wr_idx].frag = frag;
	rx_ring->rxbufs[wr_idx].dma_addr = dma_addr;

	/* Fill freelist descriptor */
	rx_ring->rxds[wr_idx].fld.reserved = 0;
	rx_ring->rxds[wr_idx].fld.meta_len_dd = 0;
	nfp_desc_set_dma_addr(&rx_ring->rxds[wr_idx].fld,
			      dma_addr + dp->rx_dma_off);

	rx_ring->wr_p++;
	if (!(rx_ring->wr_p % NFP_NET_FL_BATCH)) {
		/* Update write pointer of the freelist queue. Make
		 * sure all writes are flushed before telling the hardware.
		 */
		wmb();
		nfp_qcp_wr_ptr_add(rx_ring->qcp_fl, NFP_NET_FL_BATCH);
	}
}

/**
 * nfp_net_rx_ring_reset() - Reflect in SW state of freelist after disable
 * @rx_ring: RX ring structure
 *
 * Assumes that the device is stopped, must be idempotent.
 */
static void nfp_net_rx_ring_reset(struct nfp_net_rx_ring *rx_ring)
{
	unsigned int wr_idx, last_idx;

	/* wr_p == rd_p means ring was never fed FL bufs. RX rings are always
	 * kept at cnt - 1 FL bufs.
	 */
	if (rx_ring->wr_p == 0 && rx_ring->rd_p == 0)
		return;

	/* Move the empty entry to the end of the list */
	wr_idx = D_IDX(rx_ring, rx_ring->wr_p);
	last_idx = rx_ring->cnt - 1;
	rx_ring->rxbufs[wr_idx].dma_addr = rx_ring->rxbufs[last_idx].dma_addr;
	rx_ring->rxbufs[wr_idx].frag = rx_ring->rxbufs[last_idx].frag;
	rx_ring->rxbufs[last_idx].dma_addr = 0;
	rx_ring->rxbufs[last_idx].frag = NULL;

	memset(rx_ring->rxds, 0, rx_ring->size);
	rx_ring->wr_p = 0;
	rx_ring->rd_p = 0;
}

/**
 * nfp_net_rx_ring_bufs_free() - Free any buffers currently on the RX ring
 * @dp:      NFP Net data path struct
 * @rx_ring: RX ring to remove buffers from
 *
 * Assumes that the device is stopped and buffers are in [0, ring->cnt - 1)
 * entries. After device is disabled nfp_net_rx_ring_reset() must be called
 * to restore required ring geometry.
 */
static void
nfp_net_rx_ring_bufs_free(struct nfp_net_dp *dp,
			  struct nfp_net_rx_ring *rx_ring)
{
	unsigned int i;

	for (i = 0; i < rx_ring->cnt - 1; i++) {
		/* NULL skb can only happen when initial filling of the ring
		 * fails to allocate enough buffers and calls here to free
		 * already allocated ones.
		 */
		if (!rx_ring->rxbufs[i].frag)
			continue;

		nfp_net_dma_unmap_rx(dp, rx_ring->rxbufs[i].dma_addr);
		nfp_net_free_frag(rx_ring->rxbufs[i].frag, dp->xdp_prog);
		rx_ring->rxbufs[i].dma_addr = 0;
		rx_ring->rxbufs[i].frag = NULL;
	}
}

/**
 * nfp_net_rx_ring_bufs_alloc() - Fill RX ring with buffers (don't give to FW)
 * @dp:      NFP Net data path struct
 * @rx_ring: RX ring to fill with buffers
 */
static int
nfp_net_rx_ring_bufs_alloc(struct nfp_net_dp *dp,
			   struct nfp_net_rx_ring *rx_ring)
{
	struct nfp_net_rx_buf *rxbufs;
	unsigned int i;

	rxbufs = rx_ring->rxbufs;

	for (i = 0; i < rx_ring->cnt - 1; i++) {
		rxbufs[i].frag = nfp_net_rx_alloc_one(dp, &rxbufs[i].dma_addr);
		if (!rxbufs[i].frag) {
			nfp_net_rx_ring_bufs_free(dp, rx_ring);
			return -ENOMEM;
		}
	}

	return 0;
}

/**
 * nfp_net_rx_ring_fill_freelist() - Give buffers from the ring to FW
 * @dp:      NFP Net data path struct
 * @rx_ring: RX ring to fill
 */
static void
nfp_net_rx_ring_fill_freelist(struct nfp_net_dp *dp,
			      struct nfp_net_rx_ring *rx_ring)
{
	unsigned int i;

	for (i = 0; i < rx_ring->cnt - 1; i++)
		nfp_net_rx_give_one(dp, rx_ring, rx_ring->rxbufs[i].frag,
				    rx_ring->rxbufs[i].dma_addr);
}

/**
 * nfp_net_rx_csum_has_errors() - group check if rxd has any csum errors
 * @flags: RX descriptor flags field in CPU byte order
 */
static int nfp_net_rx_csum_has_errors(u16 flags)
{
	u16 csum_all_checked, csum_all_ok;

	csum_all_checked = flags & __PCIE_DESC_RX_CSUM_ALL;
	csum_all_ok = flags & __PCIE_DESC_RX_CSUM_ALL_OK;

	return csum_all_checked != (csum_all_ok << PCIE_DESC_RX_CSUM_OK_SHIFT);
}

/**
 * nfp_net_rx_csum() - set SKB checksum field based on RX descriptor flags
 * @dp:    NFP Net data path struct
 * @r_vec: per-ring structure
 * @rxd:   Pointer to RX descriptor
 * @meta:  Parsed metadata prepend
 * @skb:   Pointer to SKB
 */
static void nfp_net_rx_csum(struct nfp_net_dp *dp,
			    struct nfp_net_r_vector *r_vec,
			    struct nfp_net_rx_desc *rxd,
			    struct nfp_meta_parsed *meta, struct sk_buff *skb)
{
	skb_checksum_none_assert(skb);

	if (!(dp->netdev->features & NETIF_F_RXCSUM))
		return;

	if (meta->csum_type) {
		skb->ip_summed = meta->csum_type;
		skb->csum = meta->csum;
		u64_stats_update_begin(&r_vec->rx_sync);
		r_vec->hw_csum_rx_complete++;
		u64_stats_update_end(&r_vec->rx_sync);
		return;
	}

	if (nfp_net_rx_csum_has_errors(le16_to_cpu(rxd->rxd.flags))) {
		u64_stats_update_begin(&r_vec->rx_sync);
		r_vec->hw_csum_rx_error++;
		u64_stats_update_end(&r_vec->rx_sync);
		return;
	}

	/* Assume that the firmware will never report inner CSUM_OK unless outer
	 * L4 headers were successfully parsed. FW will always report zero UDP
	 * checksum as CSUM_OK.
	 */
	if (rxd->rxd.flags & PCIE_DESC_RX_TCP_CSUM_OK ||
	    rxd->rxd.flags & PCIE_DESC_RX_UDP_CSUM_OK) {
		__skb_incr_checksum_unnecessary(skb);
		u64_stats_update_begin(&r_vec->rx_sync);
		r_vec->hw_csum_rx_ok++;
		u64_stats_update_end(&r_vec->rx_sync);
	}

	if (rxd->rxd.flags & PCIE_DESC_RX_I_TCP_CSUM_OK ||
	    rxd->rxd.flags & PCIE_DESC_RX_I_UDP_CSUM_OK) {
		__skb_incr_checksum_unnecessary(skb);
		u64_stats_update_begin(&r_vec->rx_sync);
		r_vec->hw_csum_rx_inner_ok++;
		u64_stats_update_end(&r_vec->rx_sync);
	}
}

static void
nfp_net_set_hash(struct net_device *netdev, struct nfp_meta_parsed *meta,
		 unsigned int type, __be32 *hash)
{
	if (!(netdev->features & NETIF_F_RXHASH))
		return;

	switch (type) {
	case NFP_NET_RSS_IPV4:
	case NFP_NET_RSS_IPV6:
	case NFP_NET_RSS_IPV6_EX:
		meta->hash_type = PKT_HASH_TYPE_L3;
		break;
	default:
		meta->hash_type = PKT_HASH_TYPE_L4;
		break;
	}

	meta->hash = get_unaligned_be32(hash);
}

static void
nfp_net_set_hash_desc(struct net_device *netdev, struct nfp_meta_parsed *meta,
		      void *data, struct nfp_net_rx_desc *rxd)
{
	struct nfp_net_rx_hash *rx_hash = data;

	if (!(rxd->rxd.flags & PCIE_DESC_RX_RSS))
		return;

	nfp_net_set_hash(netdev, meta, get_unaligned_be32(&rx_hash->hash_type),
			 &rx_hash->hash);
}

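/* Parse the chained RX metadata prepend: a 32-bit word of 4-bit field type
 * IDs (consumed from the lowest bits up) followed by the data for each field.
 * Fills in @meta. Returns true when the metadata cannot be parsed (unknown
 * field type, or the fields do not end exactly at the packet data).
 */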
static bool
nfp_net_parse_meta(struct net_device *netdev, struct nfp_meta_parsed *meta,
		   void *data, void *pkt, unsigned int pkt_len, int meta_len)
{
	u32 meta_info;

	meta_info = get_unaligned_be32(data);
	data += 4;

	while (meta_info) {
		switch (meta_info & NFP_NET_META_FIELD_MASK) {
		case NFP_NET_META_HASH:
			meta_info >>= NFP_NET_META_FIELD_SIZE;
			nfp_net_set_hash(netdev, meta,
					 meta_info & NFP_NET_META_FIELD_MASK,
					 (__be32 *)data);
			data += 4;
			break;
		case NFP_NET_META_MARK:
			meta->mark = get_unaligned_be32(data);
			data += 4;
			break;
		case NFP_NET_META_PORTID:
			meta->portid = get_unaligned_be32(data);
			data += 4;
			break;
		case NFP_NET_META_CSUM:
			meta->csum_type = CHECKSUM_COMPLETE;
			meta->csum =
				(__force __wsum)__get_unaligned_cpu32(data);
			data += 4;
			break;
		case NFP_NET_META_RESYNC_INFO:
			if (nfp_net_tls_rx_resync_req(netdev, data, pkt,
						      pkt_len))
				return false;
			data += sizeof(struct nfp_net_tls_resync_req);
			break;
		default:
			return true;
		}

		meta_info >>= NFP_NET_META_FIELD_SIZE;
	}

	return data != pkt;
}

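/* Account a dropped RX packet and release its resources. If both an skb and
 * an rxbuf are passed the replacement buffer allocation failed; take an
 * extra page reference so the frag can be put back on the freelist before
 * the skb built on top of it is freed.
 */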
e9949aeb 1713static void
6fe0c3b4
JK
1714nfp_net_rx_drop(const struct nfp_net_dp *dp, struct nfp_net_r_vector *r_vec,
1715 struct nfp_net_rx_ring *rx_ring, struct nfp_net_rx_buf *rxbuf,
1716 struct sk_buff *skb)
e9949aeb
JK
1717{
1718 u64_stats_update_begin(&r_vec->rx_sync);
1719 r_vec->rx_drops++;
16f50cda
JK
1720 /* If we have both skb and rxbuf the replacement buffer allocation
1721 * must have failed, count this as an alloc failure.
1722 */
1723 if (skb && rxbuf)
1724 r_vec->rx_replace_buf_alloc_fail++;
e9949aeb
JK
1725 u64_stats_update_end(&r_vec->rx_sync);
1726
c0f031bc
JK
 1727 /* The skb is built around the frag; freeing the skb would also free the
 1728 * frag, so to be able to reuse the frag we need an extra ref.
1729 */
1730 if (skb && rxbuf && skb->head == rxbuf->frag)
1731 page_ref_inc(virt_to_head_page(rxbuf->frag));
e9949aeb 1732 if (rxbuf)
6fe0c3b4 1733 nfp_net_rx_give_one(dp, rx_ring, rxbuf->frag, rxbuf->dma_addr);
e9949aeb
JK
1734 if (skb)
1735 dev_kfree_skb_any(skb);
1736}
1737
a67edbf4 1738static bool
79c12a75 1739nfp_net_tx_xdp_buf(struct nfp_net_dp *dp, struct nfp_net_rx_ring *rx_ring,
ecd63a02 1740 struct nfp_net_tx_ring *tx_ring,
1abae319 1741 struct nfp_net_rx_buf *rxbuf, unsigned int dma_off,
abeeec4a 1742 unsigned int pkt_len, bool *completed)
ecd63a02 1743{
fa6540b8 1744 unsigned int dma_map_sz = dp->fl_bufsz - NFP_NET_RX_BUF_NON_DATA;
ecd63a02
JK
1745 struct nfp_net_tx_buf *txbuf;
1746 struct nfp_net_tx_desc *txd;
ecd63a02
JK
1747 int wr_idx;
1748
fa6540b8
JDB
 1749 /* Reject if xdp_adjust_tail has grown the packet beyond the DMA area */
1750 if (pkt_len + dma_off > dma_map_sz)
1751 return false;
1752
ecd63a02 1753 if (unlikely(nfp_net_tx_full(tx_ring, 1))) {
abeeec4a
JK
1754 if (!*completed) {
1755 nfp_net_xdp_complete(tx_ring);
1756 *completed = true;
1757 }
1758
1759 if (unlikely(nfp_net_tx_full(tx_ring, 1))) {
1760 nfp_net_rx_drop(dp, rx_ring->r_vec, rx_ring, rxbuf,
1761 NULL);
1762 return false;
1763 }
ecd63a02
JK
1764 }
1765
4aa3b766 1766 wr_idx = D_IDX(tx_ring, tx_ring->wr_p);
ecd63a02
JK
1767
1768 /* Stash the soft descriptor of the head then initialize it */
1769 txbuf = &tx_ring->txbufs[wr_idx];
92e68195
JK
1770
1771 nfp_net_rx_give_one(dp, rx_ring, txbuf->frag, txbuf->dma_addr);
1772
ecd63a02
JK
1773 txbuf->frag = rxbuf->frag;
1774 txbuf->dma_addr = rxbuf->dma_addr;
1775 txbuf->fidx = -1;
1776 txbuf->pkt_cnt = 1;
1777 txbuf->real_len = pkt_len;
1778
1abae319 1779 dma_sync_single_for_device(dp->dev, rxbuf->dma_addr + dma_off,
d58cebb7 1780 pkt_len, DMA_BIDIRECTIONAL);
ecd63a02
JK
1781
1782 /* Build TX descriptor */
1783 txd = &tx_ring->txds[wr_idx];
1784 txd->offset_eop = PCIE_DESC_TX_EOP;
1785 txd->dma_len = cpu_to_le16(pkt_len);
1abae319 1786 nfp_desc_set_dma_addr(txd, rxbuf->dma_addr + dma_off);
ecd63a02
JK
1787 txd->data_len = cpu_to_le16(pkt_len);
1788
1789 txd->flags = 0;
1790 txd->mss = 0;
e53fc9fa 1791 txd->lso_hdrlen = 0;
ecd63a02
JK
1792
1793 tx_ring->wr_p++;
1794 tx_ring->wr_ptr_add++;
a67edbf4 1795 return true;
ecd63a02
JK
1796}
1797
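/* Editor's note -- illustrative sketch, not part of the driver.
 * The TX and RX rings keep free-running wr_p/rd_p counters and map them to a
 * descriptor slot with D_IDX(), as in nfp_net_tx_xdp_buf() above. A minimal
 * model of that mapping, assuming D_IDX() reduces the pointer modulo the ring
 * size and that the ring size is a power of two (the driver programs
 * ilog2(cnt) into the hardware), so the modulo becomes a mask:
 */
#if 0	/* example only, never compiled into the driver */
struct example_ring {
	unsigned int cnt;	/* number of descriptors, power of two */
	unsigned int wr_p;	/* free-running write pointer */
};

static unsigned int example_d_idx(const struct example_ring *ring)
{
	/* wrap the free-running pointer into [0, cnt) without a division */
	return ring->wr_p & (ring->cnt - 1);
}

/* e.g. cnt = 256, wr_p = 260  ->  slot 4 */
#endif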
4c352362
JK
1798/**
1799 * nfp_net_rx() - receive up to @budget packets on @rx_ring
1800 * @rx_ring: RX ring to receive from
1801 * @budget: NAPI budget
1802 *
 1803 * Note: this function is separated out from the napi poll function so that
 1804 * the packet receive code is kept apart from the other bookkeeping work
 1805 * performed in the napi poll function.
1806 *
4c352362
JK
1807 * Return: Number of packets received.
1808 */
1809static int nfp_net_rx(struct nfp_net_rx_ring *rx_ring, int budget)
1810{
1811 struct nfp_net_r_vector *r_vec = rx_ring->r_vec;
79c12a75 1812 struct nfp_net_dp *dp = &r_vec->nfp_net->dp;
ecd63a02
JK
1813 struct nfp_net_tx_ring *tx_ring;
1814 struct bpf_prog *xdp_prog;
abeeec4a 1815 bool xdp_tx_cmpl = false;
ecd63a02 1816 unsigned int true_bufsz;
c0f031bc 1817 struct sk_buff *skb;
416db5c1 1818 int pkts_polled = 0;
7f1c684a 1819 struct xdp_buff xdp;
4c352362
JK
1820 int idx;
1821
ecd63a02 1822 rcu_read_lock();
79c12a75 1823 xdp_prog = READ_ONCE(dp->xdp_prog);
79c12a75 1824 true_bufsz = xdp_prog ? PAGE_SIZE : dp->fl_bufsz;
fa6540b8 1825 xdp.frame_sz = PAGE_SIZE - NFP_NET_RX_BUF_HEADROOM;
7f1c684a 1826 xdp.rxq = &rx_ring->xdp_rxq;
ecd63a02
JK
1827 tx_ring = r_vec->xdp_ring;
1828
416db5c1 1829 while (pkts_polled < budget) {
5cd4fbea 1830 unsigned int meta_len, data_len, meta_off, pkt_len, pkt_off;
13df4c66
JK
1831 struct nfp_net_rx_buf *rxbuf;
1832 struct nfp_net_rx_desc *rxd;
e524a6a9 1833 struct nfp_meta_parsed meta;
27f54b58 1834 bool redir_egress = false;
91bf82ca 1835 struct net_device *netdev;
13df4c66 1836 dma_addr_t new_dma_addr;
65d88fd0 1837 u32 meta_len_xdp = 0;
13df4c66
JK
1838 void *new_frag;
1839
4aa3b766 1840 idx = D_IDX(rx_ring, rx_ring->rd_p);
4c352362
JK
1841
1842 rxd = &rx_ring->rxds[idx];
416db5c1 1843 if (!(rxd->rxd.meta_len_dd & PCIE_DESC_RX_DD))
4c352362 1844 break;
416db5c1 1845
4c352362
JK
 1846 /* Memory barrier to ensure that we won't do other descriptor reads
 1847 * before the DD bit has been read.
1848 */
1849 dma_rmb();
1850
e524a6a9
JK
1851 memset(&meta, 0, sizeof(meta));
1852
4c352362
JK
1853 rx_ring->rd_p++;
1854 pkts_polled++;
4c352362 1855
c0f031bc 1856 rxbuf = &rx_ring->rxbufs[idx];
180012dc
JK
1857 /* < meta_len >
1858 * <-- [rx_offset] -->
1859 * ---------------------------------------------------------
1860 * | [XX] | metadata | packet | XXXX |
1861 * ---------------------------------------------------------
1862 * <---------------- data_len --------------->
1863 *
 1864 * The rx_offset is fixed for all packets, while the meta_len can vary on a
 1865 * packet-by-packet basis. If rx_offset is set to zero (_RX_OFFSET_DYNAMIC),
 1866 * the metadata starts at the beginning of the buffer and is immediately
 1867 * followed by the packet (no [XX]); a worked offset example follows this function.
1868 */
4c352362
JK
1869 meta_len = rxd->rxd.meta_len_dd & PCIE_DESC_RX_META_LEN_MASK;
1870 data_len = le16_to_cpu(rxd->rxd.data_len);
13df4c66 1871 pkt_len = data_len - meta_len;
4c352362 1872
5cd4fbea 1873 pkt_off = NFP_NET_RX_BUF_HEADROOM + dp->rx_dma_off;
79c12a75 1874 if (dp->rx_offset == NFP_NET_CFG_RX_OFFSET_DYNAMIC)
5cd4fbea 1875 pkt_off += meta_len;
180012dc 1876 else
5cd4fbea
JK
1877 pkt_off += dp->rx_offset;
1878 meta_off = pkt_off - meta_len;
4c352362 1879
4c352362
JK
1880 /* Stats update */
1881 u64_stats_update_begin(&r_vec->rx_sync);
1882 r_vec->rx_pkts++;
13df4c66 1883 r_vec->rx_bytes += pkt_len;
4c352362
JK
1884 u64_stats_update_end(&r_vec->rx_sync);
1885
b92fb77f
JK
1886 if (unlikely(meta_len > NFP_NET_MAX_PREPEND ||
1887 (dp->rx_offset && meta_len > dp->rx_offset))) {
1888 nn_dp_warn(dp, "oversized RX packet metadata %u\n",
1889 meta_len);
6fe0c3b4 1890 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf, NULL);
b92fb77f
JK
1891 continue;
1892 }
1893
5cd4fbea
JK
1894 nfp_net_dma_sync_cpu_rx(dp, rxbuf->dma_addr + meta_off,
1895 data_len);
1896
e524a6a9
JK
1897 if (!dp->chained_metadata_format) {
1898 nfp_net_set_hash_desc(dp->netdev, &meta,
1899 rxbuf->frag + meta_off, rxd);
1900 } else if (meta_len) {
572c7245
JK
1901 if (unlikely(nfp_net_parse_meta(dp->netdev, &meta,
1902 rxbuf->frag + meta_off,
1903 rxbuf->frag + pkt_off,
6a35ddc5 1904 pkt_len, meta_len))) {
e524a6a9
JK
1905 nn_dp_warn(dp, "invalid RX packet metadata\n");
1906 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf,
1907 NULL);
1908 continue;
1909 }
1910 }
1911
5f428401 1912 if (xdp_prog && !meta.portid) {
65d88fd0 1913 void *orig_data = rxbuf->frag + pkt_off;
1abae319 1914 unsigned int dma_off;
ecd63a02
JK
1915 int act;
1916
65d88fd0
DB
1917 xdp.data_hard_start = rxbuf->frag + NFP_NET_RX_BUF_HEADROOM;
1918 xdp.data = orig_data;
1919 xdp.data_meta = orig_data;
1920 xdp.data_end = orig_data + pkt_len;
1921
1922 act = bpf_prog_run_xdp(xdp_prog, &xdp);
1923
5a6a22e3 1924 pkt_len = xdp.data_end - xdp.data;
65d88fd0 1925 pkt_off += xdp.data - orig_data;
6fe0c3b4 1926
ecd63a02
JK
1927 switch (act) {
1928 case XDP_PASS:
65d88fd0 1929 meta_len_xdp = xdp.data - xdp.data_meta;
ecd63a02
JK
1930 break;
1931 case XDP_TX:
5cd4fbea 1932 dma_off = pkt_off - NFP_NET_RX_BUF_HEADROOM;
79c12a75 1933 if (unlikely(!nfp_net_tx_xdp_buf(dp, rx_ring,
a67edbf4 1934 tx_ring, rxbuf,
1abae319 1935 dma_off,
abeeec4a
JK
1936 pkt_len,
1937 &xdp_tx_cmpl)))
79c12a75
JK
1938 trace_xdp_exception(dp->netdev,
1939 xdp_prog, act);
ecd63a02
JK
1940 continue;
1941 default:
1942 bpf_warn_invalid_xdp_action(act);
df561f66 1943 fallthrough;
ecd63a02 1944 case XDP_ABORTED:
79c12a75 1945 trace_xdp_exception(dp->netdev, xdp_prog, act);
df561f66 1946 fallthrough;
ecd63a02 1947 case XDP_DROP:
6fe0c3b4 1948 nfp_net_rx_give_one(dp, rx_ring, rxbuf->frag,
ecd63a02
JK
1949 rxbuf->dma_addr);
1950 continue;
1951 }
1952 }
1953
78a8b760
JK
1954 if (likely(!meta.portid)) {
1955 netdev = dp->netdev;
79ca38e8
JK
1956 } else if (meta.portid == NFP_META_PORT_ID_CTRL) {
1957 struct nfp_net *nn = netdev_priv(dp->netdev);
1958
1959 nfp_app_ctrl_rx_raw(nn->app, rxbuf->frag + pkt_off,
1960 pkt_len);
1961 nfp_net_rx_give_one(dp, rx_ring, rxbuf->frag,
1962 rxbuf->dma_addr);
1963 continue;
78a8b760
JK
1964 } else {
1965 struct nfp_net *nn;
1966
1967 nn = netdev_priv(dp->netdev);
27f54b58
JH
1968 netdev = nfp_app_dev_get(nn->app, meta.portid,
1969 &redir_egress);
78a8b760
JK
1970 if (unlikely(!netdev)) {
1971 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf,
1972 NULL);
1973 continue;
1974 }
27f54b58
JH
1975
1976 if (nfp_netdev_is_nfp_repr(netdev))
1977 nfp_repr_inc_rx_stats(netdev, pkt_len);
78a8b760
JK
1978 }
1979
ecd63a02 1980 skb = build_skb(rxbuf->frag, true_bufsz);
13df4c66 1981 if (unlikely(!skb)) {
6fe0c3b4 1982 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf, NULL);
13df4c66
JK
1983 continue;
1984 }
c487e6b1 1985 new_frag = nfp_net_napi_alloc_one(dp, &new_dma_addr);
13df4c66 1986 if (unlikely(!new_frag)) {
6fe0c3b4 1987 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf, skb);
13df4c66
JK
1988 continue;
1989 }
1990
1691a4c0
JK
1991 nfp_net_dma_unmap_rx(dp, rxbuf->dma_addr);
1992
1993 nfp_net_rx_give_one(dp, rx_ring, new_frag, new_dma_addr);
1994
5cd4fbea 1995 skb_reserve(skb, pkt_off);
13df4c66
JK
1996 skb_put(skb, pkt_len);
1997
e524a6a9
JK
1998 skb->mark = meta.mark;
1999 skb_set_hash(skb, meta.hash, meta.hash_type);
19d0f54e 2000
4c352362 2001 skb_record_rx_queue(skb, rx_ring->idx);
91bf82ca 2002 skb->protocol = eth_type_trans(skb, netdev);
4c352362 2003
ddb98d94 2004 nfp_net_rx_csum(dp, r_vec, rxd, &meta, skb);
4c352362 2005
5bcb5c7e
DM
2006#ifdef CONFIG_TLS_DEVICE
2007 if (rxd->rxd.flags & PCIE_DESC_RX_DECRYPTED) {
2008 skb->decrypted = true;
2009 u64_stats_update_begin(&r_vec->rx_sync);
2010 r_vec->hw_tls_rx++;
2011 u64_stats_update_end(&r_vec->rx_sync);
2012 }
2013#endif
2014
4c352362
JK
2015 if (rxd->rxd.flags & PCIE_DESC_RX_VLAN)
2016 __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
2017 le16_to_cpu(rxd->rxd.vlan));
65d88fd0
DB
2018 if (meta_len_xdp)
2019 skb_metadata_set(skb, meta_len_xdp);
4c352362 2020
27f54b58
JH
2021 if (likely(!redir_egress)) {
2022 napi_gro_receive(&rx_ring->r_vec->napi, skb);
2023 } else {
2024 skb->dev = netdev;
dce5cccc 2025 skb_reset_network_header(skb);
27f54b58
JH
2026 __skb_push(skb, ETH_HLEN);
2027 dev_queue_xmit(skb);
2028 }
4c352362
JK
2029 }
2030
abeeec4a
JK
2031 if (xdp_prog) {
2032 if (tx_ring->wr_ptr_add)
2033 nfp_net_tx_xmit_more_flush(tx_ring);
2034 else if (unlikely(tx_ring->wr_p != tx_ring->rd_p) &&
2035 !xdp_tx_cmpl)
2036 if (!nfp_net_xdp_complete(tx_ring))
2037 pkts_polled = budget;
2038 }
ecd63a02
JK
2039 rcu_read_unlock();
2040
4c352362
JK
2041 return pkts_polled;
2042}
2043
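/* Editor's note -- illustrative sketch, not part of the driver.
 * A worked example of the pkt_off/meta_off arithmetic used in nfp_net_rx()
 * above. The numeric values (headroom, rx_offset, meta_len) are hypothetical
 * and only illustrate the two layouts described in the in-function comment;
 * "headroom" here stands for NFP_NET_RX_BUF_HEADROOM + dp->rx_dma_off.
 */
#if 0	/* example only, never compiled into the driver */
static void example_rx_offsets(unsigned int headroom, unsigned int rx_offset,
			       unsigned int meta_len,
			       unsigned int *pkt_off, unsigned int *meta_off)
{
	*pkt_off = headroom;
	if (!rx_offset)			/* dynamic: meta directly precedes packet */
		*pkt_off += meta_len;
	else				/* fixed: packet always at headroom + rx_offset */
		*pkt_off += rx_offset;
	*meta_off = *pkt_off - meta_len;
}

/* fixed layout:   headroom = 64, rx_offset = 32, meta_len = 8
 *                 -> pkt_off = 96, meta_off = 88
 * dynamic layout: headroom = 64, rx_offset = 0,  meta_len = 8
 *                 -> pkt_off = 72, meta_off = 64
 */
#endif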
2044/**
2045 * nfp_net_poll() - napi poll function
2046 * @napi: NAPI structure
2047 * @budget: NAPI budget
2048 *
2049 * Return: number of packets polled.
2050 */
2051static int nfp_net_poll(struct napi_struct *napi, int budget)
2052{
2053 struct nfp_net_r_vector *r_vec =
2054 container_of(napi, struct nfp_net_r_vector, napi);
cbeaf7aa 2055 unsigned int pkts_polled = 0;
4c352362 2056
cbeaf7aa 2057 if (r_vec->tx_ring)
d387b8a1 2058 nfp_net_tx_complete(r_vec->tx_ring, budget);
abeeec4a 2059 if (r_vec->rx_ring)
cbeaf7aa 2060 pkts_polled = nfp_net_rx(r_vec->rx_ring, budget);
4c352362 2061
7de5f115
JK
2062 if (pkts_polled < budget)
2063 if (napi_complete_done(napi, pkts_polled))
2064 nfp_net_irq_unmask(r_vec->nfp_net, r_vec->irq_entry);
4c352362
JK
2065
2066 return pkts_polled;
2067}
2068
77ece8d5
JK
2069/* Control device data path
2070 */
2071
2072static bool
2073nfp_ctrl_tx_one(struct nfp_net *nn, struct nfp_net_r_vector *r_vec,
2074 struct sk_buff *skb, bool old)
2075{
2076 unsigned int real_len = skb->len, meta_len = 0;
2077 struct nfp_net_tx_ring *tx_ring;
2078 struct nfp_net_tx_buf *txbuf;
2079 struct nfp_net_tx_desc *txd;
2080 struct nfp_net_dp *dp;
2081 dma_addr_t dma_addr;
2082 int wr_idx;
2083
2084 dp = &r_vec->nfp_net->dp;
2085 tx_ring = r_vec->tx_ring;
2086
2087 if (WARN_ON_ONCE(skb_shinfo(skb)->nr_frags)) {
2088 nn_dp_warn(dp, "Driver's CTRL TX does not implement gather\n");
2089 goto err_free;
2090 }
2091
2092 if (unlikely(nfp_net_tx_full(tx_ring, 1))) {
2093 u64_stats_update_begin(&r_vec->tx_sync);
2094 r_vec->tx_busy++;
2095 u64_stats_update_end(&r_vec->tx_sync);
2096 if (!old)
2097 __skb_queue_tail(&r_vec->queue, skb);
2098 else
2099 __skb_queue_head(&r_vec->queue, skb);
2100 return true;
2101 }
2102
2103 if (nfp_app_ctrl_has_meta(nn->app)) {
2104 if (unlikely(skb_headroom(skb) < 8)) {
2105 nn_dp_warn(dp, "CTRL TX on skb without headroom\n");
2106 goto err_free;
2107 }
2108 meta_len = 8;
2109 put_unaligned_be32(NFP_META_PORT_ID_CTRL, skb_push(skb, 4));
2110 put_unaligned_be32(NFP_NET_META_PORTID, skb_push(skb, 4));
2111 }
2112
2113 /* Start with the head skbuf */
2114 dma_addr = dma_map_single(dp->dev, skb->data, skb_headlen(skb),
2115 DMA_TO_DEVICE);
2116 if (dma_mapping_error(dp->dev, dma_addr))
2117 goto err_dma_warn;
2118
2119 wr_idx = D_IDX(tx_ring, tx_ring->wr_p);
2120
2121 /* Stash the soft descriptor of the head then initialize it */
2122 txbuf = &tx_ring->txbufs[wr_idx];
2123 txbuf->skb = skb;
2124 txbuf->dma_addr = dma_addr;
2125 txbuf->fidx = -1;
2126 txbuf->pkt_cnt = 1;
2127 txbuf->real_len = real_len;
2128
2129 /* Build TX descriptor */
2130 txd = &tx_ring->txds[wr_idx];
2131 txd->offset_eop = meta_len | PCIE_DESC_TX_EOP;
2132 txd->dma_len = cpu_to_le16(skb_headlen(skb));
2133 nfp_desc_set_dma_addr(txd, dma_addr);
2134 txd->data_len = cpu_to_le16(skb->len);
2135
2136 txd->flags = 0;
2137 txd->mss = 0;
2138 txd->lso_hdrlen = 0;
2139
2140 tx_ring->wr_p++;
2141 tx_ring->wr_ptr_add++;
2142 nfp_net_tx_xmit_more_flush(tx_ring);
2143
2144 return false;
2145
2146err_dma_warn:
2147 nn_dp_warn(dp, "Failed to DMA map TX CTRL buffer\n");
2148err_free:
2149 u64_stats_update_begin(&r_vec->tx_sync);
2150 r_vec->tx_errors++;
2151 u64_stats_update_end(&r_vec->tx_sync);
2152 dev_kfree_skb_any(skb);
2153 return false;
2154}
2155
d48ae231
JK
2156bool __nfp_ctrl_tx(struct nfp_net *nn, struct sk_buff *skb)
2157{
2158 struct nfp_net_r_vector *r_vec = &nn->r_vecs[0];
2159
2160 return nfp_ctrl_tx_one(nn, r_vec, skb, false);
2161}
2162
77ece8d5
JK
2163bool nfp_ctrl_tx(struct nfp_net *nn, struct sk_buff *skb)
2164{
2165 struct nfp_net_r_vector *r_vec = &nn->r_vecs[0];
2166 bool ret;
2167
2168 spin_lock_bh(&r_vec->lock);
2169 ret = nfp_ctrl_tx_one(nn, r_vec, skb, false);
2170 spin_unlock_bh(&r_vec->lock);
2171
2172 return ret;
2173}
2174
2175static void __nfp_ctrl_tx_queued(struct nfp_net_r_vector *r_vec)
2176{
2177 struct sk_buff *skb;
2178
2179 while ((skb = __skb_dequeue(&r_vec->queue)))
2180 if (nfp_ctrl_tx_one(r_vec->nfp_net, r_vec, skb, true))
2181 return;
2182}
2183
2184static bool
2185nfp_ctrl_meta_ok(struct nfp_net *nn, void *data, unsigned int meta_len)
2186{
2187 u32 meta_type, meta_tag;
2188
2189 if (!nfp_app_ctrl_has_meta(nn->app))
2190 return !meta_len;
2191
2192 if (meta_len != 8)
2193 return false;
2194
2195 meta_type = get_unaligned_be32(data);
2196 meta_tag = get_unaligned_be32(data + 4);
2197
2198 return (meta_type == NFP_NET_META_PORTID &&
2199 meta_tag == NFP_META_PORT_ID_CTRL);
2200}
2201
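/* Editor's note -- illustrative sketch, not part of the driver.
 * nfp_ctrl_tx_one() prepends exactly 8 bytes of metadata to control messages:
 * a big-endian NFP_NET_META_PORTID word followed by a big-endian
 * NFP_META_PORT_ID_CTRL word (it pushes the tag first, then the type, so the
 * type ends up in front), and nfp_ctrl_meta_ok() above accepts only that
 * layout. A standalone model of the check, with the two constants passed in
 * rather than hard-coded:
 */
#if 0	/* example only, never compiled into the driver */
static unsigned int example_load_be32(const unsigned char *p)
{
	return ((unsigned int)p[0] << 24) | (p[1] << 16) | (p[2] << 8) | p[3];
}

static int example_ctrl_meta_ok(const unsigned char *meta, unsigned int len,
				unsigned int type_portid, unsigned int tag_ctrl)
{
	return len == 8 &&
	       example_load_be32(meta) == type_portid &&
	       example_load_be32(meta + 4) == tag_ctrl;
}
#endif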
2202static bool
2203nfp_ctrl_rx_one(struct nfp_net *nn, struct nfp_net_dp *dp,
2204 struct nfp_net_r_vector *r_vec, struct nfp_net_rx_ring *rx_ring)
2205{
2206 unsigned int meta_len, data_len, meta_off, pkt_len, pkt_off;
2207 struct nfp_net_rx_buf *rxbuf;
2208 struct nfp_net_rx_desc *rxd;
2209 dma_addr_t new_dma_addr;
2210 struct sk_buff *skb;
2211 void *new_frag;
2212 int idx;
2213
2214 idx = D_IDX(rx_ring, rx_ring->rd_p);
2215
2216 rxd = &rx_ring->rxds[idx];
2217 if (!(rxd->rxd.meta_len_dd & PCIE_DESC_RX_DD))
2218 return false;
2219
 2220 /* Memory barrier to ensure that we won't do other descriptor reads
 2221 * before the DD bit has been read.
2222 */
2223 dma_rmb();
2224
2225 rx_ring->rd_p++;
2226
2227 rxbuf = &rx_ring->rxbufs[idx];
2228 meta_len = rxd->rxd.meta_len_dd & PCIE_DESC_RX_META_LEN_MASK;
2229 data_len = le16_to_cpu(rxd->rxd.data_len);
2230 pkt_len = data_len - meta_len;
2231
2232 pkt_off = NFP_NET_RX_BUF_HEADROOM + dp->rx_dma_off;
2233 if (dp->rx_offset == NFP_NET_CFG_RX_OFFSET_DYNAMIC)
2234 pkt_off += meta_len;
2235 else
2236 pkt_off += dp->rx_offset;
2237 meta_off = pkt_off - meta_len;
2238
2239 /* Stats update */
2240 u64_stats_update_begin(&r_vec->rx_sync);
2241 r_vec->rx_pkts++;
2242 r_vec->rx_bytes += pkt_len;
2243 u64_stats_update_end(&r_vec->rx_sync);
2244
2245 nfp_net_dma_sync_cpu_rx(dp, rxbuf->dma_addr + meta_off, data_len);
2246
2247 if (unlikely(!nfp_ctrl_meta_ok(nn, rxbuf->frag + meta_off, meta_len))) {
2248 nn_dp_warn(dp, "incorrect metadata for ctrl packet (%d)\n",
2249 meta_len);
2250 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf, NULL);
2251 return true;
2252 }
2253
2254 skb = build_skb(rxbuf->frag, dp->fl_bufsz);
2255 if (unlikely(!skb)) {
2256 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf, NULL);
2257 return true;
2258 }
2259 new_frag = nfp_net_napi_alloc_one(dp, &new_dma_addr);
2260 if (unlikely(!new_frag)) {
2261 nfp_net_rx_drop(dp, r_vec, rx_ring, rxbuf, skb);
2262 return true;
2263 }
2264
2265 nfp_net_dma_unmap_rx(dp, rxbuf->dma_addr);
2266
2267 nfp_net_rx_give_one(dp, rx_ring, new_frag, new_dma_addr);
2268
2269 skb_reserve(skb, pkt_off);
2270 skb_put(skb, pkt_len);
2271
02082701 2272 nfp_app_ctrl_rx(nn->app, skb);
77ece8d5
JK
2273
2274 return true;
2275}
2276
ff58e2df 2277static bool nfp_ctrl_rx(struct nfp_net_r_vector *r_vec)
77ece8d5
JK
2278{
2279 struct nfp_net_rx_ring *rx_ring = r_vec->rx_ring;
2280 struct nfp_net *nn = r_vec->nfp_net;
2281 struct nfp_net_dp *dp = &nn->dp;
ff58e2df 2282 unsigned int budget = 512;
77ece8d5 2283
ff58e2df 2284 while (nfp_ctrl_rx_one(nn, dp, r_vec, rx_ring) && budget--)
77ece8d5 2285 continue;
ff58e2df
JK
2286
2287 return budget;
77ece8d5
JK
2288}
2289
2290static void nfp_ctrl_poll(unsigned long arg)
2291{
2292 struct nfp_net_r_vector *r_vec = (void *)arg;
2293
6577b0f7 2294 spin_lock(&r_vec->lock);
d387b8a1 2295 nfp_net_tx_complete(r_vec->tx_ring, 0);
77ece8d5 2296 __nfp_ctrl_tx_queued(r_vec);
6577b0f7 2297 spin_unlock(&r_vec->lock);
77ece8d5 2298
ff58e2df
JK
2299 if (nfp_ctrl_rx(r_vec)) {
2300 nfp_net_irq_unmask(r_vec->nfp_net, r_vec->irq_entry);
2301 } else {
2302 tasklet_schedule(&r_vec->tasklet);
2303 nn_dp_warn(&r_vec->nfp_net->dp,
2304 "control message budget exceeded!\n");
2305 }
77ece8d5
JK
2306}
2307
4c352362
JK
2308/* Setup and Configuration
2309 */
2310
cd083ce1
JK
2311/**
2312 * nfp_net_vecs_init() - Assign IRQs and setup rvecs.
2313 * @nn: NFP Network structure
2314 */
2315static void nfp_net_vecs_init(struct nfp_net *nn)
2316{
2317 struct nfp_net_r_vector *r_vec;
2318 int r;
2319
2320 nn->lsc_handler = nfp_net_irq_lsc;
2321 nn->exn_handler = nfp_net_irq_exn;
2322
2323 for (r = 0; r < nn->max_r_vecs; r++) {
2324 struct msix_entry *entry;
2325
2326 entry = &nn->irq_entries[NFP_NET_NON_Q_VECTORS + r];
2327
2328 r_vec = &nn->r_vecs[r];
2329 r_vec->nfp_net = nn;
cd083ce1
JK
2330 r_vec->irq_entry = entry->entry;
2331 r_vec->irq_vector = entry->vector;
2332
77ece8d5
JK
2333 if (nn->dp.netdev) {
2334 r_vec->handler = nfp_net_irq_rxtx;
2335 } else {
2336 r_vec->handler = nfp_ctrl_irq_rxtx;
2337
2338 __skb_queue_head_init(&r_vec->queue);
2339 spin_lock_init(&r_vec->lock);
2340 tasklet_init(&r_vec->tasklet, nfp_ctrl_poll,
2341 (unsigned long)r_vec);
2342 tasklet_disable(&r_vec->tasklet);
2343 }
2344
cd083ce1
JK
2345 cpumask_set_cpu(r, &r_vec->affinity_mask);
2346 }
2347}
2348
4c352362
JK
2349/**
2350 * nfp_net_tx_ring_free() - Free resources allocated to a TX ring
2351 * @tx_ring: TX ring to free
2352 */
2353static void nfp_net_tx_ring_free(struct nfp_net_tx_ring *tx_ring)
2354{
2355 struct nfp_net_r_vector *r_vec = tx_ring->r_vec;
79c12a75 2356 struct nfp_net_dp *dp = &r_vec->nfp_net->dp;
4c352362 2357
46627170 2358 kvfree(tx_ring->txbufs);
4c352362
JK
2359
2360 if (tx_ring->txds)
79c12a75 2361 dma_free_coherent(dp->dev, tx_ring->size,
4c352362
JK
2362 tx_ring->txds, tx_ring->dma);
2363
2364 tx_ring->cnt = 0;
4c352362
JK
2365 tx_ring->txbufs = NULL;
2366 tx_ring->txds = NULL;
2367 tx_ring->dma = 0;
2368 tx_ring->size = 0;
2369}
2370
2371/**
2372 * nfp_net_tx_ring_alloc() - Allocate resource for a TX ring
892a7f70 2373 * @dp: NFP Net data path struct
4c352362
JK
2374 * @tx_ring: TX Ring structure to allocate
2375 *
2376 * Return: 0 on success, negative errno otherwise.
2377 */
ecd63a02 2378static int
92e68195 2379nfp_net_tx_ring_alloc(struct nfp_net_dp *dp, struct nfp_net_tx_ring *tx_ring)
4c352362
JK
2380{
2381 struct nfp_net_r_vector *r_vec = tx_ring->r_vec;
4c352362 2382
892a7f70 2383 tx_ring->cnt = dp->txd_cnt;
4c352362 2384
5ea14712 2385 tx_ring->size = array_size(tx_ring->cnt, sizeof(*tx_ring->txds));
750afb08
LC
2386 tx_ring->txds = dma_alloc_coherent(dp->dev, tx_ring->size,
2387 &tx_ring->dma,
2388 GFP_KERNEL | __GFP_NOWARN);
23d9f553
JK
2389 if (!tx_ring->txds) {
2390 netdev_warn(dp->netdev, "failed to allocate TX descriptor ring memory, requested descriptor count: %d, consider lowering descriptor count\n",
2391 tx_ring->cnt);
4c352362 2392 goto err_alloc;
23d9f553 2393 }
4c352362 2394
46627170
JK
2395 tx_ring->txbufs = kvcalloc(tx_ring->cnt, sizeof(*tx_ring->txbufs),
2396 GFP_KERNEL);
4c352362
JK
2397 if (!tx_ring->txbufs)
2398 goto err_alloc;
2399
a7b1ad08 2400 if (!tx_ring->is_xdp && dp->netdev)
79c12a75 2401 netif_set_xps_queue(dp->netdev, &r_vec->affinity_mask,
ecd63a02 2402 tx_ring->idx);
4c352362 2403
4c352362
JK
2404 return 0;
2405
2406err_alloc:
2407 nfp_net_tx_ring_free(tx_ring);
2408 return -ENOMEM;
2409}
2410
92e68195
JK
2411static void
2412nfp_net_tx_ring_bufs_free(struct nfp_net_dp *dp,
2413 struct nfp_net_tx_ring *tx_ring)
2414{
2415 unsigned int i;
2416
2417 if (!tx_ring->is_xdp)
2418 return;
2419
2420 for (i = 0; i < tx_ring->cnt; i++) {
2421 if (!tx_ring->txbufs[i].frag)
2422 return;
2423
2424 nfp_net_dma_unmap_rx(dp, tx_ring->txbufs[i].dma_addr);
2425 __free_page(virt_to_page(tx_ring->txbufs[i].frag));
2426 }
2427}
2428
2429static int
2430nfp_net_tx_ring_bufs_alloc(struct nfp_net_dp *dp,
2431 struct nfp_net_tx_ring *tx_ring)
2432{
2433 struct nfp_net_tx_buf *txbufs = tx_ring->txbufs;
2434 unsigned int i;
2435
2436 if (!tx_ring->is_xdp)
2437 return 0;
2438
2439 for (i = 0; i < tx_ring->cnt; i++) {
2440 txbufs[i].frag = nfp_net_rx_alloc_one(dp, &txbufs[i].dma_addr);
2441 if (!txbufs[i].frag) {
2442 nfp_net_tx_ring_bufs_free(dp, tx_ring);
2443 return -ENOMEM;
2444 }
2445 }
2446
2447 return 0;
2448}
2449
892a7f70 2450static int nfp_net_tx_rings_prepare(struct nfp_net *nn, struct nfp_net_dp *dp)
cc7c0333 2451{
cc7c0333
JK
2452 unsigned int r;
2453
892a7f70
JK
2454 dp->tx_rings = kcalloc(dp->num_tx_rings, sizeof(*dp->tx_rings),
2455 GFP_KERNEL);
2456 if (!dp->tx_rings)
2457 return -ENOMEM;
cc7c0333 2458
892a7f70 2459 for (r = 0; r < dp->num_tx_rings; r++) {
ecd63a02
JK
2460 int bias = 0;
2461
512e94dc
JK
2462 if (r >= dp->num_stack_tx_rings)
2463 bias = dp->num_stack_tx_rings;
cc7c0333 2464
892a7f70 2465 nfp_net_tx_ring_init(&dp->tx_rings[r], &nn->r_vecs[r - bias],
92e68195 2466 r, bias);
ecd63a02 2467
92e68195 2468 if (nfp_net_tx_ring_alloc(dp, &dp->tx_rings[r]))
cc7c0333 2469 goto err_free_prev;
92e68195
JK
2470
2471 if (nfp_net_tx_ring_bufs_alloc(dp, &dp->tx_rings[r]))
2472 goto err_free_ring;
cc7c0333
JK
2473 }
2474
892a7f70 2475 return 0;
cc7c0333
JK
2476
2477err_free_prev:
92e68195
JK
2478 while (r--) {
2479 nfp_net_tx_ring_bufs_free(dp, &dp->tx_rings[r]);
2480err_free_ring:
892a7f70 2481 nfp_net_tx_ring_free(&dp->tx_rings[r]);
92e68195 2482 }
892a7f70
JK
2483 kfree(dp->tx_rings);
2484 return -ENOMEM;
cc7c0333
JK
2485}
2486
892a7f70 2487static void nfp_net_tx_rings_free(struct nfp_net_dp *dp)
cc7c0333
JK
2488{
2489 unsigned int r;
2490
92e68195
JK
2491 for (r = 0; r < dp->num_tx_rings; r++) {
2492 nfp_net_tx_ring_bufs_free(dp, &dp->tx_rings[r]);
892a7f70 2493 nfp_net_tx_ring_free(&dp->tx_rings[r]);
92e68195 2494 }
cc7c0333 2495
892a7f70 2496 kfree(dp->tx_rings);
cc7c0333
JK
2497}
2498
4c352362
JK
2499/**
2500 * nfp_net_rx_ring_free() - Free resources allocated to a RX ring
2501 * @rx_ring: RX ring to free
2502 */
2503static void nfp_net_rx_ring_free(struct nfp_net_rx_ring *rx_ring)
2504{
2505 struct nfp_net_r_vector *r_vec = rx_ring->r_vec;
79c12a75 2506 struct nfp_net_dp *dp = &r_vec->nfp_net->dp;
4c352362 2507
a9c324be
JK
2508 if (dp->netdev)
2509 xdp_rxq_info_unreg(&rx_ring->xdp_rxq);
46627170 2510 kvfree(rx_ring->rxbufs);
4c352362
JK
2511
2512 if (rx_ring->rxds)
79c12a75 2513 dma_free_coherent(dp->dev, rx_ring->size,
4c352362
JK
2514 rx_ring->rxds, rx_ring->dma);
2515
2516 rx_ring->cnt = 0;
4c352362
JK
2517 rx_ring->rxbufs = NULL;
2518 rx_ring->rxds = NULL;
2519 rx_ring->dma = 0;
2520 rx_ring->size = 0;
2521}
2522
2523/**
2524 * nfp_net_rx_ring_alloc() - Allocate resource for a RX ring
2195c263 2525 * @dp: NFP Net data path struct
4c352362
JK
2526 * @rx_ring: RX ring to allocate
2527 *
2528 * Return: 0 on success, negative errno otherwise.
2529 */
30d21171 2530static int
892a7f70 2531nfp_net_rx_ring_alloc(struct nfp_net_dp *dp, struct nfp_net_rx_ring *rx_ring)
4c352362 2532{
46627170 2533 int err;
7f1c684a 2534
a9c324be
JK
2535 if (dp->netdev) {
2536 err = xdp_rxq_info_reg(&rx_ring->xdp_rxq, dp->netdev,
2537 rx_ring->idx);
2538 if (err < 0)
2539 return err;
2540 }
4c352362 2541
892a7f70 2542 rx_ring->cnt = dp->rxd_cnt;
5ea14712 2543 rx_ring->size = array_size(rx_ring->cnt, sizeof(*rx_ring->rxds));
750afb08
LC
2544 rx_ring->rxds = dma_alloc_coherent(dp->dev, rx_ring->size,
2545 &rx_ring->dma,
2546 GFP_KERNEL | __GFP_NOWARN);
23d9f553
JK
2547 if (!rx_ring->rxds) {
2548 netdev_warn(dp->netdev, "failed to allocate RX descriptor ring memory, requested descriptor count: %d, consider lowering descriptor count\n",
2549 rx_ring->cnt);
4c352362 2550 goto err_alloc;
23d9f553 2551 }
4c352362 2552
46627170
JK
2553 rx_ring->rxbufs = kvcalloc(rx_ring->cnt, sizeof(*rx_ring->rxbufs),
2554 GFP_KERNEL);
4c352362
JK
2555 if (!rx_ring->rxbufs)
2556 goto err_alloc;
2557
4c352362
JK
2558 return 0;
2559
2560err_alloc:
2561 nfp_net_rx_ring_free(rx_ring);
2562 return -ENOMEM;
2563}
2564
892a7f70 2565static int nfp_net_rx_rings_prepare(struct nfp_net *nn, struct nfp_net_dp *dp)
36a857e4 2566{
36a857e4
JK
2567 unsigned int r;
2568
892a7f70
JK
2569 dp->rx_rings = kcalloc(dp->num_rx_rings, sizeof(*dp->rx_rings),
2570 GFP_KERNEL);
2571 if (!dp->rx_rings)
2572 return -ENOMEM;
36a857e4 2573
892a7f70
JK
2574 for (r = 0; r < dp->num_rx_rings; r++) {
2575 nfp_net_rx_ring_init(&dp->rx_rings[r], &nn->r_vecs[r], r);
36a857e4 2576
892a7f70 2577 if (nfp_net_rx_ring_alloc(dp, &dp->rx_rings[r]))
36a857e4
JK
2578 goto err_free_prev;
2579
892a7f70 2580 if (nfp_net_rx_ring_bufs_alloc(dp, &dp->rx_rings[r]))
36a857e4
JK
2581 goto err_free_ring;
2582 }
2583
892a7f70 2584 return 0;
36a857e4
JK
2585
2586err_free_prev:
2587 while (r--) {
892a7f70 2588 nfp_net_rx_ring_bufs_free(dp, &dp->rx_rings[r]);
36a857e4 2589err_free_ring:
892a7f70 2590 nfp_net_rx_ring_free(&dp->rx_rings[r]);
36a857e4 2591 }
892a7f70
JK
2592 kfree(dp->rx_rings);
2593 return -ENOMEM;
36a857e4
JK
2594}
2595
892a7f70 2596static void nfp_net_rx_rings_free(struct nfp_net_dp *dp)
36a857e4
JK
2597{
2598 unsigned int r;
2599
892a7f70
JK
2600 for (r = 0; r < dp->num_rx_rings; r++) {
2601 nfp_net_rx_ring_bufs_free(dp, &dp->rx_rings[r]);
2602 nfp_net_rx_ring_free(&dp->rx_rings[r]);
36a857e4
JK
2603 }
2604
892a7f70 2605 kfree(dp->rx_rings);
36a857e4
JK
2606}
2607
e31230f9 2608static void
79c12a75
JK
2609nfp_net_vector_assign_rings(struct nfp_net_dp *dp,
2610 struct nfp_net_r_vector *r_vec, int idx)
e31230f9 2611{
79c12a75 2612 r_vec->rx_ring = idx < dp->num_rx_rings ? &dp->rx_rings[idx] : NULL;
ecd63a02 2613 r_vec->tx_ring =
79c12a75 2614 idx < dp->num_stack_tx_rings ? &dp->tx_rings[idx] : NULL;
ecd63a02 2615
79c12a75
JK
2616 r_vec->xdp_ring = idx < dp->num_tx_rings - dp->num_stack_tx_rings ?
2617 &dp->tx_rings[dp->num_stack_tx_rings + idx] : NULL;
e31230f9
JK
2618}
2619
0afbfb18
JK
2620static int
2621nfp_net_prepare_vector(struct nfp_net *nn, struct nfp_net_r_vector *r_vec,
2622 int idx)
4c352362 2623{
0afbfb18 2624 int err;
4c352362 2625
164d1e9e 2626 /* Setup NAPI */
77ece8d5
JK
2627 if (nn->dp.netdev)
2628 netif_napi_add(nn->dp.netdev, &r_vec->napi,
2629 nfp_net_poll, NAPI_POLL_WEIGHT);
2630 else
2631 tasklet_enable(&r_vec->tasklet);
164d1e9e 2632
0afbfb18 2633 snprintf(r_vec->name, sizeof(r_vec->name),
77ece8d5 2634 "%s-rxtx-%d", nfp_net_name(nn), idx);
fdace6c2
JK
2635 err = request_irq(r_vec->irq_vector, r_vec->handler, 0, r_vec->name,
2636 r_vec);
0afbfb18 2637 if (err) {
77ece8d5
JK
2638 if (nn->dp.netdev)
2639 netif_napi_del(&r_vec->napi);
2640 else
2641 tasklet_disable(&r_vec->tasklet);
2642
fdace6c2 2643 nn_err(nn, "Error requesting IRQ %d\n", r_vec->irq_vector);
0afbfb18
JK
2644 return err;
2645 }
fdace6c2 2646 disable_irq(r_vec->irq_vector);
4c352362 2647
fdace6c2 2648 irq_set_affinity_hint(r_vec->irq_vector, &r_vec->affinity_mask);
4c352362 2649
fdace6c2
JK
2650 nn_dbg(nn, "RV%02d: irq=%03d/%03d\n", idx, r_vec->irq_vector,
2651 r_vec->irq_entry);
4c352362 2652
0afbfb18 2653 return 0;
4c352362
JK
2654}
2655
0afbfb18
JK
2656static void
2657nfp_net_cleanup_vector(struct nfp_net *nn, struct nfp_net_r_vector *r_vec)
4c352362 2658{
fdace6c2 2659 irq_set_affinity_hint(r_vec->irq_vector, NULL);
77ece8d5
JK
2660 if (nn->dp.netdev)
2661 netif_napi_del(&r_vec->napi);
2662 else
2663 tasklet_disable(&r_vec->tasklet);
2664
fdace6c2 2665 free_irq(r_vec->irq_vector, r_vec);
4c352362
JK
2666}
2667
2668/**
2669 * nfp_net_rss_write_itbl() - Write RSS indirection table to device
2670 * @nn: NFP Net device to reconfigure
2671 */
2672void nfp_net_rss_write_itbl(struct nfp_net *nn)
2673{
2674 int i;
2675
2676 for (i = 0; i < NFP_NET_CFG_RSS_ITBL_SZ; i += 4)
2677 nn_writel(nn, NFP_NET_CFG_RSS_ITBL + i,
2678 get_unaligned_le32(nn->rss_itbl + i));
2679}
2680
2681/**
2682 * nfp_net_rss_write_key() - Write RSS hash key to device
2683 * @nn: NFP Net device to reconfigure
2684 */
2685void nfp_net_rss_write_key(struct nfp_net *nn)
2686{
2687 int i;
2688
9ff304bf 2689 for (i = 0; i < nfp_net_rss_key_sz(nn); i += 4)
4c352362
JK
2690 nn_writel(nn, NFP_NET_CFG_RSS_KEY + i,
2691 get_unaligned_le32(nn->rss_key + i));
2692}
2693
2694/**
2695 * nfp_net_coalesce_write_cfg() - Write irq coalescence configuration to HW
2696 * @nn: NFP Net device to reconfigure
2697 */
2698void nfp_net_coalesce_write_cfg(struct nfp_net *nn)
2699{
2700 u8 i;
2701 u32 factor;
2702 u32 value;
2703
2704 /* Compute factor used to convert coalesce '_usecs' parameters to
2705 * ME timestamp ticks. There are 16 ME clock cycles for each timestamp
2706 * count.
2707 */
ce991ab6 2708 factor = nn->tlv_caps.me_freq_mhz / 16;
4c352362
JK
2709
2710 /* copy RX interrupt coalesce parameters */
2711 value = (nn->rx_coalesce_max_frames << 16) |
2712 (factor * nn->rx_coalesce_usecs);
79c12a75 2713 for (i = 0; i < nn->dp.num_rx_rings; i++)
4c352362
JK
2714 nn_writel(nn, NFP_NET_CFG_RXR_IRQ_MOD(i), value);
2715
2716 /* copy TX interrupt coalesce parameters */
2717 value = (nn->tx_coalesce_max_frames << 16) |
2718 (factor * nn->tx_coalesce_usecs);
79c12a75 2719 for (i = 0; i < nn->dp.num_tx_rings; i++)
4c352362
JK
2720 nn_writel(nn, NFP_NET_CFG_TXR_IRQ_MOD(i), value);
2721}
2722
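/* Editor's note -- illustrative sketch, not part of the driver.
 * nfp_net_coalesce_write_cfg() converts the coalescing "usecs" parameters into
 * ME timestamp ticks (16 ME clock cycles per tick, hence
 * factor = me_freq_mhz / 16) and packs them with the frame count as
 * (frames << 16) | ticks. A worked example with hypothetical numbers:
 * me_freq_mhz = 1200 -> factor = 75, so 50 usecs = 3750 ticks, and with
 * max_frames = 64 the register value is (64 << 16) | 3750 = 0x400ea6.
 */
#if 0	/* example only, never compiled into the driver */
static unsigned int example_irq_mod_value(unsigned int me_freq_mhz,
					  unsigned int usecs,
					  unsigned int max_frames)
{
	unsigned int factor = me_freq_mhz / 16;	/* ticks per microsecond */

	return (max_frames << 16) | (factor * usecs);
}
#endif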
2723/**
f642963b 2724 * nfp_net_write_mac_addr() - Write MAC address to the device control BAR
4c352362 2725 * @nn: NFP Net device to reconfigure
9d372759 2726 * @addr: MAC address to write
4c352362 2727 *
f642963b
JK
2728 * Writes the MAC address from the netdev to the device control BAR. Does not
 2729 * perform the required reconfig. We do a bit of a byte-swapping dance because
 2730 * the firmware is LE.
4c352362 2731 */
9d372759 2732static void nfp_net_write_mac_addr(struct nfp_net *nn, const u8 *addr)
4c352362 2733{
9d372759
PC
2734 nn_writel(nn, NFP_NET_CFG_MACADDR + 0, get_unaligned_be32(addr));
2735 nn_writew(nn, NFP_NET_CFG_MACADDR + 6, get_unaligned_be16(addr + 4));
4c352362
JK
2736}
2737
ca40feab
JK
2738static void nfp_net_vec_clear_ring_data(struct nfp_net *nn, unsigned int idx)
2739{
2740 nn_writeq(nn, NFP_NET_CFG_RXR_ADDR(idx), 0);
2741 nn_writeb(nn, NFP_NET_CFG_RXR_SZ(idx), 0);
2742 nn_writeb(nn, NFP_NET_CFG_RXR_VEC(idx), 0);
2743
2744 nn_writeq(nn, NFP_NET_CFG_TXR_ADDR(idx), 0);
2745 nn_writeb(nn, NFP_NET_CFG_TXR_SZ(idx), 0);
2746 nn_writeb(nn, NFP_NET_CFG_TXR_VEC(idx), 0);
2747}
2748
4c352362
JK
2749/**
2750 * nfp_net_clear_config_and_disable() - Clear control BAR and disable NFP
2751 * @nn: NFP Net device to reconfigure
07300f77
JK
2752 *
2753 * Warning: must be fully idempotent.
4c352362
JK
2754 */
2755static void nfp_net_clear_config_and_disable(struct nfp_net *nn)
2756{
2757 u32 new_ctrl, update;
ca40feab 2758 unsigned int r;
4c352362
JK
2759 int err;
2760
79c12a75 2761 new_ctrl = nn->dp.ctrl;
4c352362
JK
2762 new_ctrl &= ~NFP_NET_CFG_CTRL_ENABLE;
2763 update = NFP_NET_CFG_UPDATE_GEN;
2764 update |= NFP_NET_CFG_UPDATE_MSIX;
2765 update |= NFP_NET_CFG_UPDATE_RING;
2766
2767 if (nn->cap & NFP_NET_CFG_CTRL_RINGCFG)
2768 new_ctrl &= ~NFP_NET_CFG_CTRL_RINGCFG;
2769
2770 nn_writeq(nn, NFP_NET_CFG_TXRS_ENABLE, 0);
2771 nn_writeq(nn, NFP_NET_CFG_RXRS_ENABLE, 0);
2772
2773 nn_writel(nn, NFP_NET_CFG_CTRL, new_ctrl);
2774 err = nfp_net_reconfig(nn, update);
aba52df8 2775 if (err)
4c352362 2776 nn_err(nn, "Could not disable device: %d\n", err);
4c352362 2777
79c12a75
JK
2778 for (r = 0; r < nn->dp.num_rx_rings; r++)
2779 nfp_net_rx_ring_reset(&nn->dp.rx_rings[r]);
2780 for (r = 0; r < nn->dp.num_tx_rings; r++)
2781 nfp_net_tx_ring_reset(&nn->dp, &nn->dp.tx_rings[r]);
2782 for (r = 0; r < nn->dp.num_r_vecs; r++)
ca40feab
JK
2783 nfp_net_vec_clear_ring_data(nn, r);
2784
79c12a75 2785 nn->dp.ctrl = new_ctrl;
4c352362
JK
2786}
2787
ca40feab 2788static void
cbeaf7aa
JK
2789nfp_net_rx_ring_hw_cfg_write(struct nfp_net *nn,
2790 struct nfp_net_rx_ring *rx_ring, unsigned int idx)
ca40feab
JK
2791{
2792 /* Write the DMA address, size and MSI-X info to the device */
cbeaf7aa
JK
2793 nn_writeq(nn, NFP_NET_CFG_RXR_ADDR(idx), rx_ring->dma);
2794 nn_writeb(nn, NFP_NET_CFG_RXR_SZ(idx), ilog2(rx_ring->cnt));
fdace6c2 2795 nn_writeb(nn, NFP_NET_CFG_RXR_VEC(idx), rx_ring->r_vec->irq_entry);
cbeaf7aa 2796}
ca40feab 2797
cbeaf7aa
JK
2798static void
2799nfp_net_tx_ring_hw_cfg_write(struct nfp_net *nn,
2800 struct nfp_net_tx_ring *tx_ring, unsigned int idx)
2801{
2802 nn_writeq(nn, NFP_NET_CFG_TXR_ADDR(idx), tx_ring->dma);
2803 nn_writeb(nn, NFP_NET_CFG_TXR_SZ(idx), ilog2(tx_ring->cnt));
fdace6c2 2804 nn_writeb(nn, NFP_NET_CFG_TXR_VEC(idx), tx_ring->r_vec->irq_entry);
ca40feab
JK
2805}
2806
ac0488ef
JK
2807/**
2808 * nfp_net_set_config_and_enable() - Write control BAR and enable NFP
2809 * @nn: NFP Net device to reconfigure
2810 */
2811static int nfp_net_set_config_and_enable(struct nfp_net *nn)
1cd0cfc4 2812{
ee200a73 2813 u32 bufsz, new_ctrl, update = 0;
1cd0cfc4
JK
2814 unsigned int r;
2815 int err;
2816
79c12a75 2817 new_ctrl = nn->dp.ctrl;
1cd0cfc4 2818
611bdd49 2819 if (nn->dp.ctrl & NFP_NET_CFG_CTRL_RSS_ANY) {
1cd0cfc4
JK
2820 nfp_net_rss_write_key(nn);
2821 nfp_net_rss_write_itbl(nn);
2822 nn_writel(nn, NFP_NET_CFG_RSS_CTRL, nn->rss_cfg);
2823 update |= NFP_NET_CFG_UPDATE_RSS;
2824 }
2825
ad50451e 2826 if (nn->dp.ctrl & NFP_NET_CFG_CTRL_IRQMOD) {
1cd0cfc4 2827 nfp_net_coalesce_write_cfg(nn);
1cd0cfc4
JK
2828 update |= NFP_NET_CFG_UPDATE_IRQMOD;
2829 }
2830
79c12a75
JK
2831 for (r = 0; r < nn->dp.num_tx_rings; r++)
2832 nfp_net_tx_ring_hw_cfg_write(nn, &nn->dp.tx_rings[r], r);
2833 for (r = 0; r < nn->dp.num_rx_rings; r++)
2834 nfp_net_rx_ring_hw_cfg_write(nn, &nn->dp.rx_rings[r], r);
1cd0cfc4 2835
79c12a75
JK
2836 nn_writeq(nn, NFP_NET_CFG_TXRS_ENABLE, nn->dp.num_tx_rings == 64 ?
2837 0xffffffffffffffffULL : ((u64)1 << nn->dp.num_tx_rings) - 1);
1cd0cfc4 2838
79c12a75
JK
2839 nn_writeq(nn, NFP_NET_CFG_RXRS_ENABLE, nn->dp.num_rx_rings == 64 ?
2840 0xffffffffffffffffULL : ((u64)1 << nn->dp.num_rx_rings) - 1);
1cd0cfc4 2841
5c0dbe9e
JK
2842 if (nn->dp.netdev)
2843 nfp_net_write_mac_addr(nn, nn->dp.netdev->dev_addr);
1cd0cfc4 2844
5c0dbe9e 2845 nn_writel(nn, NFP_NET_CFG_MTU, nn->dp.mtu);
ee200a73
JK
2846
2847 bufsz = nn->dp.fl_bufsz - nn->dp.rx_dma_off - NFP_NET_RX_BUF_NON_DATA;
2848 nn_writel(nn, NFP_NET_CFG_FLBUFSZ, bufsz);
1cd0cfc4
JK
2849
2850 /* Enable device */
2851 new_ctrl |= NFP_NET_CFG_CTRL_ENABLE;
2852 update |= NFP_NET_CFG_UPDATE_GEN;
2853 update |= NFP_NET_CFG_UPDATE_MSIX;
2854 update |= NFP_NET_CFG_UPDATE_RING;
2855 if (nn->cap & NFP_NET_CFG_CTRL_RINGCFG)
2856 new_ctrl |= NFP_NET_CFG_CTRL_RINGCFG;
2857
2858 nn_writel(nn, NFP_NET_CFG_CTRL, new_ctrl);
2859 err = nfp_net_reconfig(nn, update);
ac0488ef
JK
2860 if (err) {
2861 nfp_net_clear_config_and_disable(nn);
2862 return err;
2863 }
1cd0cfc4 2864
79c12a75 2865 nn->dp.ctrl = new_ctrl;
1cd0cfc4 2866
79c12a75 2867 for (r = 0; r < nn->dp.num_rx_rings; r++)
6fe0c3b4 2868 nfp_net_rx_ring_fill_freelist(&nn->dp, &nn->dp.rx_rings[r]);
aba52df8 2869
ac0488ef 2870 return 0;
1cd0cfc4
JK
2871}
2872
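/* Editor's note -- illustrative sketch, not part of the driver.
 * nfp_net_set_config_and_enable() writes a one-bit-per-ring enable mask to
 * NFP_NET_CFG_TXRS_ENABLE/_RXRS_ENABLE. It special-cases 64 rings because
 * ((u64)1 << 64) - 1 would shift a 64-bit value by its full width, which is
 * undefined behaviour in C; for any smaller count the mask is simply the low
 * n bits set. A standalone version of that helper:
 */
#if 0	/* example only, never compiled into the driver */
static unsigned long long example_ring_enable_mask(unsigned int n_rings)
{
	if (n_rings == 64)
		return 0xffffffffffffffffULL;	/* all 64 rings enabled */
	return (1ULL << n_rings) - 1;		/* low n_rings bits set */
}

/* example_ring_enable_mask(4) == 0xf, example_ring_enable_mask(64) == ~0ULL */
#endif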
d00ca2f3
JK
2873/**
2874 * nfp_net_close_stack() - Quiesce the stack (part of close)
2875 * @nn: NFP Net device to reconfigure
2876 */
2877static void nfp_net_close_stack(struct nfp_net *nn)
2878{
2879 unsigned int r;
2880
2881 disable_irq(nn->irq_entries[NFP_NET_IRQ_LSC_IDX].vector);
2882 netif_carrier_off(nn->dp.netdev);
2883 nn->link_up = false;
2884
2885 for (r = 0; r < nn->dp.num_r_vecs; r++) {
2886 disable_irq(nn->r_vecs[r].irq_vector);
2887 napi_disable(&nn->r_vecs[r].napi);
2888 }
2889
2890 netif_tx_disable(nn->dp.netdev);
2891}
2892
2893/**
2894 * nfp_net_close_free_all() - Free all runtime resources
2895 * @nn: NFP Net device to reconfigure
2896 */
2897static void nfp_net_close_free_all(struct nfp_net *nn)
2898{
2899 unsigned int r;
2900
4621199d
JK
2901 nfp_net_tx_rings_free(&nn->dp);
2902 nfp_net_rx_rings_free(&nn->dp);
2903
d00ca2f3
JK
2904 for (r = 0; r < nn->dp.num_r_vecs; r++)
2905 nfp_net_cleanup_vector(nn, &nn->r_vecs[r]);
2906
d00ca2f3
JK
2907 nfp_net_aux_irq_free(nn, NFP_NET_CFG_LSC, NFP_NET_IRQ_LSC_IDX);
2908 nfp_net_aux_irq_free(nn, NFP_NET_CFG_EXN, NFP_NET_IRQ_EXN_IDX);
2909}
2910
2911/**
2912 * nfp_net_netdev_close() - Called when the device is downed
2913 * @netdev: netdev structure
2914 */
2915static int nfp_net_netdev_close(struct net_device *netdev)
2916{
2917 struct nfp_net *nn = netdev_priv(netdev);
2918
2919 /* Step 1: Disable RX and TX rings from the Linux kernel perspective
2920 */
2921 nfp_net_close_stack(nn);
2922
2923 /* Step 2: Tell NFP
2924 */
2925 nfp_net_clear_config_and_disable(nn);
447e9ebf 2926 nfp_port_configure(netdev, false);
d00ca2f3
JK
2927
2928 /* Step 3: Free resources
2929 */
2930 nfp_net_close_free_all(nn);
2931
2932 nn_dbg(nn, "%s down", netdev->name);
2933 return 0;
2934}
2935
77ece8d5
JK
2936void nfp_ctrl_close(struct nfp_net *nn)
2937{
2938 int r;
2939
2940 rtnl_lock();
2941
2942 for (r = 0; r < nn->dp.num_r_vecs; r++) {
2943 disable_irq(nn->r_vecs[r].irq_vector);
2944 tasklet_disable(&nn->r_vecs[r].tasklet);
2945 }
2946
2947 nfp_net_clear_config_and_disable(nn);
2948
2949 nfp_net_close_free_all(nn);
2950
2951 rtnl_unlock();
2952}
2953
1cd0cfc4
JK
2954/**
2955 * nfp_net_open_stack() - Start the device from stack's perspective
2956 * @nn: NFP Net device to reconfigure
2957 */
2958static void nfp_net_open_stack(struct nfp_net *nn)
2959{
2960 unsigned int r;
2961
79c12a75 2962 for (r = 0; r < nn->dp.num_r_vecs; r++) {
aba52df8 2963 napi_enable(&nn->r_vecs[r].napi);
fdace6c2 2964 enable_irq(nn->r_vecs[r].irq_vector);
aba52df8 2965 }
1cd0cfc4 2966
79c12a75 2967 netif_tx_wake_all_queues(nn->dp.netdev);
1cd0cfc4 2968
ce449ba7 2969 enable_irq(nn->irq_entries[NFP_NET_IRQ_LSC_IDX].vector);
1cd0cfc4
JK
2970 nfp_net_read_link_status(nn);
2971}
2972
ee26756d 2973static int nfp_net_open_alloc_all(struct nfp_net *nn)
4c352362 2974{
4c352362 2975 int err, r;
4c352362 2976
4c352362
JK
2977 err = nfp_net_aux_irq_request(nn, NFP_NET_CFG_EXN, "%s-exn",
2978 nn->exn_name, sizeof(nn->exn_name),
2979 NFP_NET_IRQ_EXN_IDX, nn->exn_handler);
2980 if (err)
2981 return err;
0ba40af9
JK
2982 err = nfp_net_aux_irq_request(nn, NFP_NET_CFG_LSC, "%s-lsc",
2983 nn->lsc_name, sizeof(nn->lsc_name),
2984 NFP_NET_IRQ_LSC_IDX, nn->lsc_handler);
2985 if (err)
2986 goto err_free_exn;
ce449ba7 2987 disable_irq(nn->irq_entries[NFP_NET_IRQ_LSC_IDX].vector);
4c352362 2988
79c12a75 2989 for (r = 0; r < nn->dp.num_r_vecs; r++) {
0afbfb18
JK
2990 err = nfp_net_prepare_vector(nn, &nn->r_vecs[r], r);
2991 if (err)
cbeaf7aa
JK
2992 goto err_cleanup_vec_p;
2993 }
a10b563d 2994
892a7f70
JK
2995 err = nfp_net_rx_rings_prepare(nn, &nn->dp);
2996 if (err)
a10b563d 2997 goto err_cleanup_vec;
114bdef0 2998
892a7f70
JK
2999 err = nfp_net_tx_rings_prepare(nn, &nn->dp);
3000 if (err)
a10b563d 3001 goto err_free_rx_rings;
4c352362 3002
e31230f9 3003 for (r = 0; r < nn->max_r_vecs; r++)
79c12a75 3004 nfp_net_vector_assign_rings(&nn->dp, &nn->r_vecs[r], r);
e31230f9 3005
ee26756d
JK
3006 return 0;
3007
3008err_free_rx_rings:
3009 nfp_net_rx_rings_free(&nn->dp);
3010err_cleanup_vec:
3011 r = nn->dp.num_r_vecs;
3012err_cleanup_vec_p:
3013 while (r--)
3014 nfp_net_cleanup_vector(nn, &nn->r_vecs[r]);
3015 nfp_net_aux_irq_free(nn, NFP_NET_CFG_LSC, NFP_NET_IRQ_LSC_IDX);
3016err_free_exn:
3017 nfp_net_aux_irq_free(nn, NFP_NET_CFG_EXN, NFP_NET_IRQ_EXN_IDX);
3018 return err;
3019}
3020
3021static int nfp_net_netdev_open(struct net_device *netdev)
3022{
3023 struct nfp_net *nn = netdev_priv(netdev);
3024 int err;
3025
3026 /* Step 1: Allocate resources for rings and the like
3027 * - Request interrupts
3028 * - Allocate RX and TX ring resources
3029 * - Setup initial RSS table
3030 */
3031 err = nfp_net_open_alloc_all(nn);
3032 if (err)
3033 return err;
3034
79c12a75 3035 err = netif_set_real_num_tx_queues(netdev, nn->dp.num_stack_tx_rings);
4c352362 3036 if (err)
ee26756d 3037 goto err_free_all;
4c352362 3038
79c12a75 3039 err = netif_set_real_num_rx_queues(netdev, nn->dp.num_rx_rings);
4c352362 3040 if (err)
ee26756d 3041 goto err_free_all;
4c352362 3042
4c352362 3043 /* Step 2: Configure the NFP
447e9ebf 3044 * - Ifup the physical interface if it exists
4c352362
JK
3045 * - Enable rings from 0 to tx_rings/rx_rings - 1.
3046 * - Write MAC address (in case it changed)
3047 * - Set the MTU
3048 * - Set the Freelist buffer size
3049 * - Enable the FW
3050 */
447e9ebf 3051 err = nfp_port_configure(netdev, true);
4c352362 3052 if (err)
ee26756d 3053 goto err_free_all;
4c352362 3054
447e9ebf
DM
3055 err = nfp_net_set_config_and_enable(nn);
3056 if (err)
3057 goto err_port_disable;
3058
4c352362
JK
3059 /* Step 3: Enable for kernel
3060 * - put some freelist descriptors on each RX ring
3061 * - enable NAPI on each ring
3062 * - enable all TX queues
3063 * - set link state
3064 */
1cd0cfc4 3065 nfp_net_open_stack(nn);
4c352362
JK
3066
3067 return 0;
3068
447e9ebf
DM
3069err_port_disable:
3070 nfp_port_configure(netdev, false);
ee26756d
JK
3071err_free_all:
3072 nfp_net_close_free_all(nn);
4c352362
JK
3073 return err;
3074}
3075
77ece8d5
JK
3076int nfp_ctrl_open(struct nfp_net *nn)
3077{
3078 int err, r;
3079
3080 /* ring dumping depends on vNICs being opened/closed under rtnl */
3081 rtnl_lock();
3082
3083 err = nfp_net_open_alloc_all(nn);
3084 if (err)
3085 goto err_unlock;
3086
3087 err = nfp_net_set_config_and_enable(nn);
3088 if (err)
3089 goto err_free_all;
3090
3091 for (r = 0; r < nn->dp.num_r_vecs; r++)
3092 enable_irq(nn->r_vecs[r].irq_vector);
3093
3094 rtnl_unlock();
3095
3096 return 0;
3097
3098err_free_all:
3099 nfp_net_close_free_all(nn);
3100err_unlock:
3101 rtnl_unlock();
3102 return err;
3103}
3104
4c352362
JK
3105static void nfp_net_set_rx_mode(struct net_device *netdev)
3106{
3107 struct nfp_net *nn = netdev_priv(netdev);
3108 u32 new_ctrl;
3109
79c12a75 3110 new_ctrl = nn->dp.ctrl;
4c352362 3111
d0adb51e
JK
3112 if (!netdev_mc_empty(netdev) || netdev->flags & IFF_ALLMULTI)
3113 new_ctrl |= nn->cap & NFP_NET_CFG_CTRL_L2MC;
3114 else
3115 new_ctrl &= ~NFP_NET_CFG_CTRL_L2MC;
3116
4c352362
JK
3117 if (netdev->flags & IFF_PROMISC) {
3118 if (nn->cap & NFP_NET_CFG_CTRL_PROMISC)
3119 new_ctrl |= NFP_NET_CFG_CTRL_PROMISC;
3120 else
3121 nn_warn(nn, "FW does not support promiscuous mode\n");
3122 } else {
3123 new_ctrl &= ~NFP_NET_CFG_CTRL_PROMISC;
3124 }
3125
79c12a75 3126 if (new_ctrl == nn->dp.ctrl)
4c352362
JK
3127 return;
3128
3129 nn_writel(nn, NFP_NET_CFG_CTRL, new_ctrl);
3d780b92 3130 nfp_net_reconfig_post(nn, NFP_NET_CFG_UPDATE_GEN);
4c352362 3131
79c12a75 3132 nn->dp.ctrl = new_ctrl;
4c352362
JK
3133}
3134
1e9e10d0
JK
3135static void nfp_net_rss_init_itbl(struct nfp_net *nn)
3136{
3137 int i;
3138
3139 for (i = 0; i < sizeof(nn->rss_itbl); i++)
3140 nn->rss_itbl[i] =
79c12a75 3141 ethtool_rxfh_indir_default(i, nn->dp.num_rx_rings);
1e9e10d0
JK
3142}
3143
512e94dc
JK
3144static void nfp_net_dp_swap(struct nfp_net *nn, struct nfp_net_dp *dp)
3145{
3146 struct nfp_net_dp new_dp = *dp;
3147
3148 *dp = nn->dp;
3149 nn->dp = new_dp;
76e1e1a8
JK
3150
3151 nn->dp.netdev->mtu = new_dp.mtu;
892a7f70
JK
3152
3153 if (!netif_is_rxfh_configured(nn->dp.netdev))
3154 nfp_net_rss_init_itbl(nn);
512e94dc
JK
3155}
3156
892a7f70 3157static int nfp_net_dp_swap_enable(struct nfp_net *nn, struct nfp_net_dp *dp)
4c352362 3158{
e31230f9 3159 unsigned int r;
164d1e9e 3160 int err;
e31230f9 3161
892a7f70 3162 nfp_net_dp_swap(nn, dp);
164d1e9e 3163
e31230f9 3164 for (r = 0; r < nn->max_r_vecs; r++)
79c12a75 3165 nfp_net_vector_assign_rings(&nn->dp, &nn->r_vecs[r], r);
e31230f9 3166
79c12a75 3167 err = netif_set_real_num_rx_queues(nn->dp.netdev, nn->dp.num_rx_rings);
08348995
AB
3168 if (err)
3169 return err;
164d1e9e 3170
79c12a75
JK
3171 if (nn->dp.netdev->real_num_tx_queues != nn->dp.num_stack_tx_rings) {
3172 err = netif_set_real_num_tx_queues(nn->dp.netdev,
3173 nn->dp.num_stack_tx_rings);
164d1e9e
JK
3174 if (err)
3175 return err;
3176 }
3177
ac0488ef 3178 return nfp_net_set_config_and_enable(nn);
68453c7a 3179}
36a857e4 3180
783496b0
JK
3181struct nfp_net_dp *nfp_net_clone_dp(struct nfp_net *nn)
3182{
3183 struct nfp_net_dp *new;
3184
3185 new = kmalloc(sizeof(*new), GFP_KERNEL);
3186 if (!new)
3187 return NULL;
3188
3189 *new = nn->dp;
3190
3191 /* Clear things which need to be recomputed */
3192 new->fl_bufsz = 0;
3193 new->tx_rings = NULL;
3194 new->rx_rings = NULL;
3195 new->num_r_vecs = 0;
3196 new->num_stack_tx_rings = 0;
3197
3198 return new;
3199}
3200
d957c0f7
JK
3201static int
3202nfp_net_check_config(struct nfp_net *nn, struct nfp_net_dp *dp,
3203 struct netlink_ext_ack *extack)
ecd63a02
JK
3204{
3205 /* XDP-enabled tests */
9dc6b116 3206 if (!dp->xdp_prog)
ecd63a02 3207 return 0;
2195c263 3208 if (dp->fl_bufsz > PAGE_SIZE) {
4d463c4d 3209 NL_SET_ERR_MSG_MOD(extack, "MTU too large w/ XDP enabled");
ecd63a02
JK
3210 return -EINVAL;
3211 }
892a7f70 3212 if (dp->num_tx_rings > nn->max_tx_rings) {
4d463c4d 3213 NL_SET_ERR_MSG_MOD(extack, "Insufficient number of TX rings w/ XDP enabled");
ecd63a02
JK
3214 return -EINVAL;
3215 }
3216
3217 return 0;
3218}
3219
d957c0f7
JK
3220int nfp_net_ring_reconfig(struct nfp_net *nn, struct nfp_net_dp *dp,
3221 struct netlink_ext_ack *extack)
cc7c0333 3222{
512e94dc 3223 int r, err;
cc7c0333 3224
76e1e1a8 3225 dp->fl_bufsz = nfp_net_calc_fl_bufsz(dp);
2195c263 3226
892a7f70 3227 dp->num_stack_tx_rings = dp->num_tx_rings;
9dc6b116 3228 if (dp->xdp_prog)
892a7f70 3229 dp->num_stack_tx_rings -= dp->num_rx_rings;
ecd63a02 3230
892a7f70 3231 dp->num_r_vecs = max(dp->num_rx_rings, dp->num_stack_tx_rings);
ecd63a02 3232
d957c0f7 3233 err = nfp_net_check_config(nn, dp, extack);
ecd63a02 3234 if (err)
783496b0 3235 goto exit_free_dp;
164d1e9e 3236
783496b0 3237 if (!netif_running(dp->netdev)) {
892a7f70 3238 nfp_net_dp_swap(nn, dp);
783496b0
JK
3239 err = 0;
3240 goto exit_free_dp;
cc7c0333
JK
3241 }
3242
cc7c0333 3243 /* Prepare new rings */
512e94dc 3244 for (r = nn->dp.num_r_vecs; r < dp->num_r_vecs; r++) {
164d1e9e
JK
3245 err = nfp_net_prepare_vector(nn, &nn->r_vecs[r], r);
3246 if (err) {
512e94dc 3247 dp->num_r_vecs = r;
164d1e9e
JK
3248 goto err_cleanup_vecs;
3249 }
3250 }
892a7f70
JK
3251
3252 err = nfp_net_rx_rings_prepare(nn, dp);
3253 if (err)
3254 goto err_cleanup_vecs;
3255
3256 err = nfp_net_tx_rings_prepare(nn, dp);
3257 if (err)
3258 goto err_free_rx;
cc7c0333
JK
3259
3260 /* Stop device, swap in new rings, try to start the firmware */
3261 nfp_net_close_stack(nn);
3262 nfp_net_clear_config_and_disable(nn);
3263
892a7f70 3264 err = nfp_net_dp_swap_enable(nn, dp);
cc7c0333 3265 if (err) {
68453c7a 3266 int err2;
cc7c0333 3267
68453c7a 3268 nfp_net_clear_config_and_disable(nn);
cc7c0333 3269
68453c7a 3270 /* Try with old configuration and old rings */
892a7f70 3271 err2 = nfp_net_dp_swap_enable(nn, dp);
68453c7a 3272 if (err2)
cc7c0333 3273 nn_err(nn, "Can't restore ring config - FW communication failed (%d,%d)\n",
68453c7a 3274 err, err2);
cc7c0333 3275 }
512e94dc 3276 for (r = dp->num_r_vecs - 1; r >= nn->dp.num_r_vecs; r--)
164d1e9e 3277 nfp_net_cleanup_vector(nn, &nn->r_vecs[r]);
cc7c0333 3278
892a7f70
JK
3279 nfp_net_rx_rings_free(dp);
3280 nfp_net_tx_rings_free(dp);
cc7c0333
JK
3281
3282 nfp_net_open_stack(nn);
783496b0
JK
3283exit_free_dp:
3284 kfree(dp);
cc7c0333
JK
3285
3286 return err;
68453c7a
JK
3287
3288err_free_rx:
892a7f70 3289 nfp_net_rx_rings_free(dp);
164d1e9e 3290err_cleanup_vecs:
512e94dc 3291 for (r = dp->num_r_vecs - 1; r >= nn->dp.num_r_vecs; r--)
164d1e9e 3292 nfp_net_cleanup_vector(nn, &nn->r_vecs[r]);
783496b0 3293 kfree(dp);
68453c7a
JK
3294 return err;
3295}
3296
3297static int nfp_net_change_mtu(struct net_device *netdev, int new_mtu)
3298{
3299 struct nfp_net *nn = netdev_priv(netdev);
783496b0 3300 struct nfp_net_dp *dp;
ccbdc596
JK
3301 int err;
3302
167cebef 3303 err = nfp_app_check_mtu(nn->app, netdev, new_mtu);
ccbdc596
JK
3304 if (err)
3305 return err;
783496b0
JK
3306
3307 dp = nfp_net_clone_dp(nn);
3308 if (!dp)
3309 return -ENOMEM;
68453c7a 3310
76e1e1a8
JK
3311 dp->mtu = new_mtu;
3312
d957c0f7 3313 return nfp_net_ring_reconfig(nn, dp, NULL);
cc7c0333
JK
3314}
3315
b64052fc
PC
3316static int
3317nfp_net_vlan_rx_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
3318{
dd5b2498 3319 const u32 cmd = NFP_NET_CFG_MBOX_CMD_CTAG_FILTER_ADD;
b64052fc 3320 struct nfp_net *nn = netdev_priv(netdev);
dd5b2498 3321 int err;
b64052fc
PC
3322
3323 /* Priority tagged packets with vlan id 0 are processed by the
3324 * NFP as untagged packets
3325 */
3326 if (!vid)
3327 return 0;
3328
dd5b2498
JK
3329 err = nfp_net_mbox_lock(nn, NFP_NET_CFG_VLAN_FILTER_SZ);
3330 if (err)
3331 return err;
3332
527d7d1b
JK
3333 nn_writew(nn, nn->tlv_caps.mbox_off + NFP_NET_CFG_VLAN_FILTER_VID, vid);
3334 nn_writew(nn, nn->tlv_caps.mbox_off + NFP_NET_CFG_VLAN_FILTER_PROTO,
3335 ETH_P_8021Q);
b64052fc 3336
dd5b2498 3337 return nfp_net_mbox_reconfig_and_unlock(nn, cmd);
b64052fc
PC
3338}
3339
3340static int
3341nfp_net_vlan_rx_kill_vid(struct net_device *netdev, __be16 proto, u16 vid)
3342{
dd5b2498 3343 const u32 cmd = NFP_NET_CFG_MBOX_CMD_CTAG_FILTER_KILL;
b64052fc 3344 struct nfp_net *nn = netdev_priv(netdev);
dd5b2498 3345 int err;
b64052fc
PC
3346
3347 /* Priority tagged packets with vlan id 0 are processed by the
3348 * NFP as untagged packets
3349 */
3350 if (!vid)
3351 return 0;
3352
dd5b2498
JK
3353 err = nfp_net_mbox_lock(nn, NFP_NET_CFG_VLAN_FILTER_SZ);
3354 if (err)
3355 return err;
3356
527d7d1b
JK
3357 nn_writew(nn, nn->tlv_caps.mbox_off + NFP_NET_CFG_VLAN_FILTER_VID, vid);
3358 nn_writew(nn, nn->tlv_caps.mbox_off + NFP_NET_CFG_VLAN_FILTER_PROTO,
3359 ETH_P_8021Q);
b64052fc 3360
dd5b2498 3361 return nfp_net_mbox_reconfig_and_unlock(nn, cmd);
b64052fc
PC
3362}
3363
bc1f4470 3364static void nfp_net_stat64(struct net_device *netdev,
3365 struct rtnl_link_stats64 *stats)
4c352362
JK
3366{
3367 struct nfp_net *nn = netdev_priv(netdev);
3368 int r;
3369
eca09be8 3370 /* Collect software stats */
29f534c4 3371 for (r = 0; r < nn->max_r_vecs; r++) {
4c352362
JK
3372 struct nfp_net_r_vector *r_vec = &nn->r_vecs[r];
3373 u64 data[3];
3374 unsigned int start;
3375
3376 do {
3377 start = u64_stats_fetch_begin(&r_vec->rx_sync);
3378 data[0] = r_vec->rx_pkts;
3379 data[1] = r_vec->rx_bytes;
3380 data[2] = r_vec->rx_drops;
3381 } while (u64_stats_fetch_retry(&r_vec->rx_sync, start));
3382 stats->rx_packets += data[0];
3383 stats->rx_bytes += data[1];
3384 stats->rx_dropped += data[2];
3385
3386 do {
3387 start = u64_stats_fetch_begin(&r_vec->tx_sync);
3388 data[0] = r_vec->tx_pkts;
3389 data[1] = r_vec->tx_bytes;
3390 data[2] = r_vec->tx_errors;
3391 } while (u64_stats_fetch_retry(&r_vec->tx_sync, start));
3392 stats->tx_packets += data[0];
3393 stats->tx_bytes += data[1];
3394 stats->tx_errors += data[2];
3395 }
eca09be8
JK
3396
3397 /* Add in device stats */
3398 stats->multicast += nn_readq(nn, NFP_NET_CFG_STATS_RX_MC_FRAMES);
3399 stats->rx_dropped += nn_readq(nn, NFP_NET_CFG_STATS_RX_DISCARDS);
3400 stats->rx_errors += nn_readq(nn, NFP_NET_CFG_STATS_RX_ERRORS);
3401
3402 stats->tx_dropped += nn_readq(nn, NFP_NET_CFG_STATS_TX_DISCARDS);
3403 stats->tx_errors += nn_readq(nn, NFP_NET_CFG_STATS_TX_ERRORS);
4c352362
JK
3404}
3405
3406static int nfp_net_set_features(struct net_device *netdev,
3407 netdev_features_t features)
3408{
3409 netdev_features_t changed = netdev->features ^ features;
3410 struct nfp_net *nn = netdev_priv(netdev);
3411 u32 new_ctrl;
3412 int err;
3413
3414 /* Assume this is not called with features we have not advertised */
3415
79c12a75 3416 new_ctrl = nn->dp.ctrl;
4c352362
JK
3417
3418 if (changed & NETIF_F_RXCSUM) {
3419 if (features & NETIF_F_RXCSUM)
ddb98d94 3420 new_ctrl |= nn->cap & NFP_NET_CFG_CTRL_RXCSUM_ANY;
4c352362 3421 else
ddb98d94 3422 new_ctrl &= ~NFP_NET_CFG_CTRL_RXCSUM_ANY;
4c352362
JK
3423 }
3424
3425 if (changed & (NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM)) {
3426 if (features & (NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM))
3427 new_ctrl |= NFP_NET_CFG_CTRL_TXCSUM;
3428 else
3429 new_ctrl &= ~NFP_NET_CFG_CTRL_TXCSUM;
3430 }
3431
3432 if (changed & (NETIF_F_TSO | NETIF_F_TSO6)) {
3433 if (features & (NETIF_F_TSO | NETIF_F_TSO6))
28063be6
EP
3434 new_ctrl |= nn->cap & NFP_NET_CFG_CTRL_LSO2 ?:
3435 NFP_NET_CFG_CTRL_LSO;
4c352362 3436 else
28063be6 3437 new_ctrl &= ~NFP_NET_CFG_CTRL_LSO_ANY;
4c352362
JK
3438 }
3439
3440 if (changed & NETIF_F_HW_VLAN_CTAG_RX) {
3441 if (features & NETIF_F_HW_VLAN_CTAG_RX)
3442 new_ctrl |= NFP_NET_CFG_CTRL_RXVLAN;
3443 else
3444 new_ctrl &= ~NFP_NET_CFG_CTRL_RXVLAN;
3445 }
3446
3447 if (changed & NETIF_F_HW_VLAN_CTAG_TX) {
3448 if (features & NETIF_F_HW_VLAN_CTAG_TX)
3449 new_ctrl |= NFP_NET_CFG_CTRL_TXVLAN;
3450 else
3451 new_ctrl &= ~NFP_NET_CFG_CTRL_TXVLAN;
3452 }
3453
b64052fc
PC
3454 if (changed & NETIF_F_HW_VLAN_CTAG_FILTER) {
3455 if (features & NETIF_F_HW_VLAN_CTAG_FILTER)
3456 new_ctrl |= NFP_NET_CFG_CTRL_CTAG_FILTER;
3457 else
3458 new_ctrl &= ~NFP_NET_CFG_CTRL_CTAG_FILTER;
3459 }
3460
4c352362
JK
3461 if (changed & NETIF_F_SG) {
3462 if (features & NETIF_F_SG)
3463 new_ctrl |= NFP_NET_CFG_CTRL_GATHER;
3464 else
3465 new_ctrl &= ~NFP_NET_CFG_CTRL_GATHER;
3466 }
3467
d692403e
JK
3468 err = nfp_port_set_features(netdev, features);
3469 if (err)
3470 return err;
7533fdc0 3471
4c352362
JK
3472 nn_dbg(nn, "Feature change 0x%llx -> 0x%llx (changed=0x%llx)\n",
3473 netdev->features, features, changed);
3474
79c12a75 3475 if (new_ctrl == nn->dp.ctrl)
4c352362
JK
3476 return 0;
3477
79c12a75 3478 nn_dbg(nn, "NIC ctrl: 0x%x -> 0x%x\n", nn->dp.ctrl, new_ctrl);
4c352362
JK
3479 nn_writel(nn, NFP_NET_CFG_CTRL, new_ctrl);
3480 err = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_GEN);
3481 if (err)
3482 return err;
3483
79c12a75 3484 nn->dp.ctrl = new_ctrl;
4c352362
JK
3485
3486 return 0;
3487}
3488
3489static netdev_features_t
3490nfp_net_features_check(struct sk_buff *skb, struct net_device *dev,
3491 netdev_features_t features)
3492{
3493 u8 l4_hdr;
3494
3495 /* We can't do TSO over double tagged packets (802.1AD) */
3496 features &= vlan_features_check(skb, features);
3497
3498 if (!skb->encapsulation)
3499 return features;
3500
3501 /* Ensure that inner L4 header offset fits into TX descriptor field */
3502 if (skb_is_gso(skb)) {
3503 u32 hdrlen;
3504
3505 hdrlen = skb_inner_transport_header(skb) - skb->data +
3506 inner_tcp_hdrlen(skb);
3507
d7cc8252
JK
 3508 /* Assume the worst-case scenario of having the longest possible
 3509 * metadata prepend - 8B
3510 */
3511 if (unlikely(hdrlen > NFP_NET_LSO_MAX_HDR_SZ - 8))
4c352362
JK
3512 features &= ~NETIF_F_GSO_MASK;
3513 }
3514
3515 /* VXLAN/GRE check */
3516 switch (vlan_get_protocol(skb)) {
3517 case htons(ETH_P_IP):
3518 l4_hdr = ip_hdr(skb)->protocol;
3519 break;
3520 case htons(ETH_P_IPV6):
3521 l4_hdr = ipv6_hdr(skb)->nexthdr;
3522 break;
3523 default:
a188222b 3524 return features & ~(NETIF_F_CSUM_MASK | NETIF_F_GSO_MASK);
4c352362
JK
3525 }
3526
3527 if (skb->inner_protocol_type != ENCAP_TYPE_ETHER ||
3528 skb->inner_protocol != htons(ETH_P_TEB) ||
3529 (l4_hdr != IPPROTO_UDP && l4_hdr != IPPROTO_GRE) ||
3530 (l4_hdr == IPPROTO_UDP &&
3531 (skb_inner_mac_header(skb) - skb_transport_header(skb) !=
3532 sizeof(struct udphdr) + sizeof(struct vxlanhdr))))
a188222b 3533 return features & ~(NETIF_F_CSUM_MASK | NETIF_F_GSO_MASK);
4c352362
JK
3534
3535 return features;
3536}
3537
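/* Editor's worked example for the hdrlen check above: for a TCP segment
 * inside a VXLAN tunnel over IPv4, hdrlen covers everything from the start
 * of the outer headers up to and including the inner TCP header:
 *
 *	outer Ethernet 14 + outer IPv4 20 + UDP 8 + VXLAN 8 +
 *	inner Ethernet 14 + inner IPv4 20 + inner TCP 20 = 104 bytes
 *
 * Those 104 bytes, plus the worst-case 8 byte metadata prepend, must still
 * fit in NFP_NET_LSO_MAX_HDR_SZ, otherwise GSO is dropped for this skb and
 * the stack segments it in software.
 */
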
static int
nfp_net_get_phys_port_name(struct net_device *netdev, char *name, size_t len)
{
	struct nfp_net *nn = netdev_priv(netdev);
	int n;

	/* If port is defined, devlink_port is registered and devlink core
	 * is taking care of name formatting.
	 */
	if (nn->port)
		return -EOPNOTSUPP;

	if (nn->dp.is_vf || nn->vnic_no_name)
		return -EOPNOTSUPP;

	n = snprintf(name, len, "n%d", nn->id);
	if (n >= len)
		return -EINVAL;

	return 0;
}

static int nfp_net_xdp_setup_drv(struct nfp_net *nn, struct netdev_bpf *bpf)
{
	struct bpf_prog *prog = bpf->prog;
	struct nfp_net_dp *dp;
	int err;

	if (!xdp_attachment_flags_ok(&nn->xdp, bpf))
		return -EBUSY;

	if (!prog == !nn->dp.xdp_prog) {
		WRITE_ONCE(nn->dp.xdp_prog, prog);
		xdp_attachment_setup(&nn->xdp, bpf);
		return 0;
	}

	dp = nfp_net_clone_dp(nn);
	if (!dp)
		return -ENOMEM;

	dp->xdp_prog = prog;
	dp->num_tx_rings += prog ? nn->dp.num_rx_rings : -nn->dp.num_rx_rings;
	dp->rx_dma_dir = prog ? DMA_BIDIRECTIONAL : DMA_FROM_DEVICE;
	dp->rx_dma_off = prog ? XDP_PACKET_HEADROOM - nn->dp.rx_offset : 0;

	/* We need RX reconfig to remap the buffers (BIDIR vs FROM_DEV) */
	err = nfp_net_ring_reconfig(nn, dp, bpf->extack);
	if (err)
		return err;

	xdp_attachment_setup(&nn->xdp, bpf);
	return 0;
}

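/* Editor's note: the clone-and-reconfig pattern above is how the driver
 * applies datapath changes atomically.  nfp_net_clone_dp() copies the live
 * nfp_net_dp, the copy is edited (extra TX rings for XDP_TX, bidirectional
 * DMA mapping, XDP headroom offset), and nfp_net_ring_reconfig() only swaps
 * it in if ring allocation and the firmware reconfig succeed.  The same
 * pattern backs other datapath changes such as MTU updates.
 */
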
static int nfp_net_xdp_setup_hw(struct nfp_net *nn, struct netdev_bpf *bpf)
{
	int err;

	if (!xdp_attachment_flags_ok(&nn->xdp_hw, bpf))
		return -EBUSY;

	err = nfp_app_xdp_offload(nn->app, nn, bpf->prog, bpf->extack);
	if (err)
		return err;

	xdp_attachment_setup(&nn->xdp_hw, bpf);
	return 0;
}

static int nfp_net_xdp(struct net_device *netdev, struct netdev_bpf *xdp)
{
	struct nfp_net *nn = netdev_priv(netdev);

	switch (xdp->command) {
	case XDP_SETUP_PROG:
		return nfp_net_xdp_setup_drv(nn, xdp);
	case XDP_SETUP_PROG_HW:
		return nfp_net_xdp_setup_hw(nn, xdp);
	default:
		return nfp_app_bpf(nn->app, nn, xdp);
	}
}

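/* Editor's usage sketch (the interface name ens4np0 and object file prog.o
 * are placeholders): the two .ndo_bpf paths above correspond to the driver
 * and hardware-offload attach modes of iproute2:
 *
 *	# ip link set dev ens4np0 xdpdrv obj prog.o sec xdp
 *	# ip link set dev ens4np0 xdpoffload obj prog.o sec xdp
 *
 * xdpdrv ends up in nfp_net_xdp_setup_drv(), xdpoffload in
 * nfp_net_xdp_setup_hw() via nfp_app_xdp_offload().
 */
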
static int nfp_net_set_mac_address(struct net_device *netdev, void *addr)
{
	struct nfp_net *nn = netdev_priv(netdev);
	struct sockaddr *saddr = addr;
	int err;

	err = eth_prepare_mac_addr_change(netdev, addr);
	if (err)
		return err;

	nfp_net_write_mac_addr(nn, saddr->sa_data);

	err = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_MACADDR);
	if (err)
		return err;

	eth_commit_mac_addr_change(netdev, addr);

	return 0;
}

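/* Editor's note: the prepare/commit split keeps netdev->dev_addr unchanged
 * if the firmware rejects the update.  From user space this is reached via,
 * for example (interface name is a placeholder):
 *
 *	# ip link set dev ens4np0 address 02:00:00:11:22:33
 *
 * With the LIVE_ADDR capability the address may also be changed while the
 * interface is up (IFF_LIVE_ADDR_CHANGE is set in nfp_net_netdev_init()).
 */
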
const struct net_device_ops nfp_net_netdev_ops = {
	.ndo_init		= nfp_app_ndo_init,
	.ndo_uninit		= nfp_app_ndo_uninit,
	.ndo_open		= nfp_net_netdev_open,
	.ndo_stop		= nfp_net_netdev_close,
	.ndo_start_xmit		= nfp_net_tx,
	.ndo_get_stats64	= nfp_net_stat64,
	.ndo_vlan_rx_add_vid	= nfp_net_vlan_rx_add_vid,
	.ndo_vlan_rx_kill_vid	= nfp_net_vlan_rx_kill_vid,
	.ndo_set_vf_mac		= nfp_app_set_vf_mac,
	.ndo_set_vf_vlan	= nfp_app_set_vf_vlan,
	.ndo_set_vf_spoofchk	= nfp_app_set_vf_spoofchk,
	.ndo_set_vf_trust	= nfp_app_set_vf_trust,
	.ndo_get_vf_config	= nfp_app_get_vf_config,
	.ndo_set_vf_link_state	= nfp_app_set_vf_link_state,
	.ndo_setup_tc		= nfp_port_setup_tc,
	.ndo_tx_timeout		= nfp_net_tx_timeout,
	.ndo_set_rx_mode	= nfp_net_set_rx_mode,
	.ndo_change_mtu		= nfp_net_change_mtu,
	.ndo_set_mac_address	= nfp_net_set_mac_address,
	.ndo_set_features	= nfp_net_set_features,
	.ndo_features_check	= nfp_net_features_check,
	.ndo_get_phys_port_name	= nfp_net_get_phys_port_name,
	.ndo_udp_tunnel_add	= udp_tunnel_nic_add_port,
	.ndo_udp_tunnel_del	= udp_tunnel_nic_del_port,
	.ndo_bpf		= nfp_net_xdp,
	.ndo_get_devlink_port	= nfp_devlink_get_devlink_port,
};

static int nfp_udp_tunnel_sync(struct net_device *netdev, unsigned int table)
{
	struct nfp_net *nn = netdev_priv(netdev);
	int i;

	BUILD_BUG_ON(NFP_NET_N_VXLAN_PORTS & 1);
	for (i = 0; i < NFP_NET_N_VXLAN_PORTS; i += 2) {
		struct udp_tunnel_info ti0, ti1;

		udp_tunnel_nic_get_port(netdev, table, i, &ti0);
		udp_tunnel_nic_get_port(netdev, table, i + 1, &ti1);

		nn_writel(nn, NFP_NET_CFG_VXLAN_PORT + i * sizeof(ti0.port),
			  be16_to_cpu(ti1.port) << 16 | be16_to_cpu(ti0.port));
	}

	return nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_VXLAN);
}

static const struct udp_tunnel_nic_info nfp_udp_tunnels = {
	.sync_table	= nfp_udp_tunnel_sync,
	.flags		= UDP_TUNNEL_NIC_INFO_MAY_SLEEP |
			  UDP_TUNNEL_NIC_INFO_OPEN_ONLY,
	.tables = {
		{
			.n_entries	= NFP_NET_N_VXLAN_PORTS,
			.tunnel_types	= UDP_TUNNEL_TYPE_VXLAN,
		},
	},
};

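/* Editor's worked example for the register packing in nfp_udp_tunnel_sync():
 * port entries are written two at a time, the odd entry in the upper 16 bits
 * of each 32-bit word.  With entry 0 = 4789 (0x12b5, the IANA VXLAN port)
 * and entry 1 = 8472 (0x2118, the legacy Linux VXLAN default), the word
 * written at NFP_NET_CFG_VXLAN_PORT (offset i * sizeof(__be16) == 0 for
 * i == 0) is:
 *
 *	(0x2118 << 16) | 0x12b5 == 0x211812b5
 *
 * The BUILD_BUG_ON() guarantees NFP_NET_N_VXLAN_PORTS is even, so the loop
 * never reads past the end of the table.
 */
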
/**
 * nfp_net_info() - Print general info about the NIC
 * @nn: NFP Net device to print information about
 */
void nfp_net_info(struct nfp_net *nn)
{
	nn_info(nn, "Netronome NFP-6xxx %sNetdev: TxQs=%d/%d RxQs=%d/%d\n",
		nn->dp.is_vf ? "VF " : "",
		nn->dp.num_tx_rings, nn->max_tx_rings,
		nn->dp.num_rx_rings, nn->max_rx_rings);
	nn_info(nn, "VER: %d.%d.%d.%d, Maximum supported MTU: %d\n",
		nn->fw_ver.resv, nn->fw_ver.class,
		nn->fw_ver.major, nn->fw_ver.minor,
		nn->max_mtu);
	nn_info(nn, "CAP: %#x %s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s\n",
		nn->cap,
		nn->cap & NFP_NET_CFG_CTRL_PROMISC  ? "PROMISC "  : "",
		nn->cap & NFP_NET_CFG_CTRL_L2BC     ? "L2BCFILT " : "",
		nn->cap & NFP_NET_CFG_CTRL_L2MC     ? "L2MCFILT " : "",
		nn->cap & NFP_NET_CFG_CTRL_RXCSUM   ? "RXCSUM "   : "",
		nn->cap & NFP_NET_CFG_CTRL_TXCSUM   ? "TXCSUM "   : "",
		nn->cap & NFP_NET_CFG_CTRL_RXVLAN   ? "RXVLAN "   : "",
		nn->cap & NFP_NET_CFG_CTRL_TXVLAN   ? "TXVLAN "   : "",
		nn->cap & NFP_NET_CFG_CTRL_SCATTER  ? "SCATTER "  : "",
		nn->cap & NFP_NET_CFG_CTRL_GATHER   ? "GATHER "   : "",
		nn->cap & NFP_NET_CFG_CTRL_LSO      ? "TSO1 "     : "",
		nn->cap & NFP_NET_CFG_CTRL_LSO2     ? "TSO2 "     : "",
		nn->cap & NFP_NET_CFG_CTRL_RSS      ? "RSS1 "     : "",
		nn->cap & NFP_NET_CFG_CTRL_RSS2     ? "RSS2 "     : "",
		nn->cap & NFP_NET_CFG_CTRL_CTAG_FILTER ? "CTAG_FILTER " : "",
		nn->cap & NFP_NET_CFG_CTRL_MSIXAUTO ? "AUTOMASK " : "",
		nn->cap & NFP_NET_CFG_CTRL_IRQMOD   ? "IRQMOD "   : "",
		nn->cap & NFP_NET_CFG_CTRL_VXLAN    ? "VXLAN "    : "",
		nn->cap & NFP_NET_CFG_CTRL_NVGRE    ? "NVGRE "    : "",
		nn->cap & NFP_NET_CFG_CTRL_CSUM_COMPLETE ?
						    "RXCSUM_COMPLETE " : "",
		nn->cap & NFP_NET_CFG_CTRL_LIVE_ADDR ? "LIVE_ADDR " : "",
		nfp_app_extra_cap(nn->app, nn));
}

/**
 * nfp_net_alloc() - Allocate netdev and related structure
 * @pdev: PCI device
 * @ctrl_bar: PCI IOMEM with vNIC config memory
 * @needs_netdev: Whether to allocate a netdev for this vNIC
 * @max_tx_rings: Maximum number of TX rings supported by device
 * @max_rx_rings: Maximum number of RX rings supported by device
 *
 * This function allocates a netdev device and fills in the initial part of
 * the @struct nfp_net structure.  For a control vNIC the nfp_net structure
 * is allocated without a netdev.
 *
 * Return: NFP Net device structure, or ERR_PTR on error.
 */
struct nfp_net *
nfp_net_alloc(struct pci_dev *pdev, void __iomem *ctrl_bar, bool needs_netdev,
	      unsigned int max_tx_rings, unsigned int max_rx_rings)
{
	struct nfp_net *nn;
	int err;

	if (needs_netdev) {
		struct net_device *netdev;

		netdev = alloc_etherdev_mqs(sizeof(struct nfp_net),
					    max_tx_rings, max_rx_rings);
		if (!netdev)
			return ERR_PTR(-ENOMEM);

		SET_NETDEV_DEV(netdev, &pdev->dev);
		nn = netdev_priv(netdev);
		nn->dp.netdev = netdev;
	} else {
		nn = vzalloc(sizeof(*nn));
		if (!nn)
			return ERR_PTR(-ENOMEM);
	}

	nn->dp.dev = &pdev->dev;
	nn->dp.ctrl_bar = ctrl_bar;
	nn->pdev = pdev;

	nn->max_tx_rings = max_tx_rings;
	nn->max_rx_rings = max_rx_rings;

	nn->dp.num_tx_rings = min_t(unsigned int,
				    max_tx_rings, num_online_cpus());
	nn->dp.num_rx_rings = min_t(unsigned int, max_rx_rings,
				    netif_get_num_default_rss_queues());

	nn->dp.num_r_vecs = max(nn->dp.num_tx_rings, nn->dp.num_rx_rings);
	nn->dp.num_r_vecs = min_t(unsigned int,
				  nn->dp.num_r_vecs, num_online_cpus());

	nn->dp.txd_cnt = NFP_NET_TX_DESCS_DEFAULT;
	nn->dp.rxd_cnt = NFP_NET_RX_DESCS_DEFAULT;

	sema_init(&nn->bar_lock, 1);

	spin_lock_init(&nn->reconfig_lock);
	spin_lock_init(&nn->link_status_lock);

	timer_setup(&nn->reconfig_timer, nfp_net_reconfig_timer, 0);

	err = nfp_net_tlv_caps_parse(&nn->pdev->dev, nn->dp.ctrl_bar,
				     &nn->tlv_caps);
	if (err)
		goto err_free_nn;

	err = nfp_ccm_mbox_alloc(nn);
	if (err)
		goto err_free_nn;

	return nn;

err_free_nn:
	if (nn->dp.netdev)
		free_netdev(nn->dp.netdev);
	else
		vfree(nn);
	return ERR_PTR(err);
}

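/* Editor's usage sketch (not driver code; the BAR pointer and ring counts
 * are placeholders): callers are expected to check the result with the
 * ERR_PTR helpers rather than against NULL:
 *
 *	nn = nfp_net_alloc(pdev, ctrl_bar, true, 8, 8);
 *	if (IS_ERR(nn))
 *		return PTR_ERR(nn);
 *
 * The real callers live in the PF and VF probe paths (nfp_net_main.c and
 * nfp_netvf_main.c).
 */
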
/**
 * nfp_net_free() - Undo what nfp_net_alloc() did
 * @nn: NFP Net device to free
 */
void nfp_net_free(struct nfp_net *nn)
{
	WARN_ON(timer_pending(&nn->reconfig_timer) || nn->reconfig_posted);
	nfp_ccm_mbox_free(nn);

	if (nn->dp.netdev)
		free_netdev(nn->dp.netdev);
	else
		vfree(nn);
}

/**
 * nfp_net_rss_key_sz() - Get current size of the RSS key
 * @nn: NFP Net device instance
 *
 * Return: size of the RSS key for currently selected hash function.
 */
unsigned int nfp_net_rss_key_sz(struct nfp_net *nn)
{
	switch (nn->rss_hfunc) {
	case ETH_RSS_HASH_TOP:
		return NFP_NET_CFG_RSS_KEY_SZ;
	case ETH_RSS_HASH_XOR:
		return 0;
	case ETH_RSS_HASH_CRC32:
		return 4;
	}

	nn_warn(nn, "Unknown hash function: %u\n", nn->rss_hfunc);
	return 0;
}

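/* Editor's note: this key size is what ethtool reports and accepts for the
 * RSS hash key.  For example (interface name is a placeholder):
 *
 *	# ethtool -x ens4np0		# dumps a NFP_NET_CFG_RSS_KEY_SZ byte key
 *	# ethtool -X ens4np0 hfunc xor
 *
 * switches to the XOR hash, for which no key is needed (size 0 above).
 */
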
/**
 * nfp_net_rss_init() - Set the initial RSS parameters
 * @nn: NFP Net device to reconfigure
 */
static void nfp_net_rss_init(struct nfp_net *nn)
{
	unsigned long func_bit, rss_cap_hfunc;
	u32 reg;

	/* Read the RSS function capability and select first supported func */
	reg = nn_readl(nn, NFP_NET_CFG_RSS_CAP);
	rss_cap_hfunc = FIELD_GET(NFP_NET_CFG_RSS_CAP_HFUNC, reg);
	if (!rss_cap_hfunc)
		rss_cap_hfunc = FIELD_GET(NFP_NET_CFG_RSS_CAP_HFUNC,
					  NFP_NET_CFG_RSS_TOEPLITZ);

	func_bit = find_first_bit(&rss_cap_hfunc, NFP_NET_CFG_RSS_HFUNCS);
	if (func_bit == NFP_NET_CFG_RSS_HFUNCS) {
		dev_warn(nn->dp.dev,
			 "Bad RSS config, defaulting to Toeplitz hash\n");
		func_bit = ETH_RSS_HASH_TOP_BIT;
	}
	nn->rss_hfunc = 1 << func_bit;

	netdev_rss_key_fill(nn->rss_key, nfp_net_rss_key_sz(nn));

	nfp_net_rss_init_itbl(nn);

	/* Enable IPv4/IPv6 TCP by default */
	nn->rss_cfg = NFP_NET_CFG_RSS_IPV4_TCP |
		      NFP_NET_CFG_RSS_IPV6_TCP |
		      FIELD_PREP(NFP_NET_CFG_RSS_HFUNC, nn->rss_hfunc) |
		      NFP_NET_CFG_RSS_MASK;
}

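/* Editor's sketch of the <linux/bitfield.h> helpers used above, with a
 * made-up mask (not the driver's real register layout):
 *
 *	#define EXAMPLE_HFUNC_MASK	GENMASK(31, 24)
 *
 *	u32 cap = 0x01000000;
 *	unsigned long hfuncs = FIELD_GET(EXAMPLE_HFUNC_MASK, cap);
 *		// hfuncs == 0x1, i.e. bit ETH_RSS_HASH_TOP_BIT is set
 *	u32 cfg = FIELD_PREP(EXAMPLE_HFUNC_MASK, 0x1);
 *		// cfg == 0x01000000, the value shifted back into the field
 *
 * FIELD_GET() extracts a field relative to its mask and FIELD_PREP() places
 * a value into that field, which is how the selected hash function is read
 * from NFP_NET_CFG_RSS_CAP and written into nn->rss_cfg above.
 */
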
/**
 * nfp_net_irqmod_init() - Set the initial IRQ moderation parameters
 * @nn: NFP Net device to reconfigure
 */
static void nfp_net_irqmod_init(struct nfp_net *nn)
{
	nn->rx_coalesce_usecs = 50;
	nn->rx_coalesce_max_frames = 64;
	nn->tx_coalesce_usecs = 50;
	nn->tx_coalesce_max_frames = 64;
}

static void nfp_net_netdev_init(struct nfp_net *nn)
{
	struct net_device *netdev = nn->dp.netdev;

	nfp_net_write_mac_addr(nn, nn->dp.netdev->dev_addr);

	netdev->mtu = nn->dp.mtu;

	/* Advertise/enable offloads based on capabilities
	 *
	 * Note: netdev->features show the currently enabled features
	 * and netdev->hw_features advertises which features are
	 * supported. By default we enable most features.
	 */
	if (nn->cap & NFP_NET_CFG_CTRL_LIVE_ADDR)
		netdev->priv_flags |= IFF_LIVE_ADDR_CHANGE;

	netdev->hw_features = NETIF_F_HIGHDMA;
	if (nn->cap & NFP_NET_CFG_CTRL_RXCSUM_ANY) {
		netdev->hw_features |= NETIF_F_RXCSUM;
		nn->dp.ctrl |= nn->cap & NFP_NET_CFG_CTRL_RXCSUM_ANY;
	}
	if (nn->cap & NFP_NET_CFG_CTRL_TXCSUM) {
		netdev->hw_features |= NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM;
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_TXCSUM;
	}
	if (nn->cap & NFP_NET_CFG_CTRL_GATHER) {
		netdev->hw_features |= NETIF_F_SG;
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_GATHER;
	}
	if ((nn->cap & NFP_NET_CFG_CTRL_LSO && nn->fw_ver.major > 2) ||
	    nn->cap & NFP_NET_CFG_CTRL_LSO2) {
		netdev->hw_features |= NETIF_F_TSO | NETIF_F_TSO6;
		nn->dp.ctrl |= nn->cap & NFP_NET_CFG_CTRL_LSO2 ?:
					 NFP_NET_CFG_CTRL_LSO;
	}
	if (nn->cap & NFP_NET_CFG_CTRL_RSS_ANY)
		netdev->hw_features |= NETIF_F_RXHASH;
	if (nn->cap & NFP_NET_CFG_CTRL_VXLAN) {
		if (nn->cap & NFP_NET_CFG_CTRL_LSO)
			netdev->hw_features |= NETIF_F_GSO_UDP_TUNNEL;
		netdev->udp_tunnel_nic_info = &nfp_udp_tunnels;
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_VXLAN;
	}
	if (nn->cap & NFP_NET_CFG_CTRL_NVGRE) {
		if (nn->cap & NFP_NET_CFG_CTRL_LSO)
			netdev->hw_features |= NETIF_F_GSO_GRE;
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_NVGRE;
	}
	if (nn->cap & (NFP_NET_CFG_CTRL_VXLAN | NFP_NET_CFG_CTRL_NVGRE))
		netdev->hw_enc_features = netdev->hw_features;

	netdev->vlan_features = netdev->hw_features;

	if (nn->cap & NFP_NET_CFG_CTRL_RXVLAN) {
		netdev->hw_features |= NETIF_F_HW_VLAN_CTAG_RX;
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_RXVLAN;
	}
	if (nn->cap & NFP_NET_CFG_CTRL_TXVLAN) {
		if (nn->cap & NFP_NET_CFG_CTRL_LSO2) {
			nn_warn(nn, "Device advertises both TSO2 and TXVLAN. Refusing to enable TXVLAN.\n");
		} else {
			netdev->hw_features |= NETIF_F_HW_VLAN_CTAG_TX;
			nn->dp.ctrl |= NFP_NET_CFG_CTRL_TXVLAN;
		}
	}
	if (nn->cap & NFP_NET_CFG_CTRL_CTAG_FILTER) {
		netdev->hw_features |= NETIF_F_HW_VLAN_CTAG_FILTER;
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_CTAG_FILTER;
	}

	netdev->features = netdev->hw_features;

	if (nfp_app_has_tc(nn->app) && nn->port)
		netdev->hw_features |= NETIF_F_HW_TC;

	/* Advertise but disable TSO by default. */
	netdev->features &= ~(NETIF_F_TSO | NETIF_F_TSO6);
	nn->dp.ctrl &= ~NFP_NET_CFG_CTRL_LSO_ANY;

	/* Finalise the netdev setup */
	netdev->netdev_ops = &nfp_net_netdev_ops;
	netdev->watchdog_timeo = msecs_to_jiffies(5 * 1000);

	/* MTU range: 68 - hw-specific max */
	netdev->min_mtu = ETH_MIN_MTU;
	netdev->max_mtu = nn->max_mtu;

	netdev->gso_max_segs = NFP_NET_LSO_MAX_SEGS;

	netif_carrier_off(netdev);

	nfp_net_set_ethtool_ops(netdev);
}

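/* Editor's note on "Advertise but disable TSO by default" above: TSO stays
 * in hw_features but is cleared from features, so it shows up as "off" and
 * can be enabled at runtime, e.g. (interface name is a placeholder):
 *
 *	# ethtool -k ens4np0 | grep tcp-segmentation-offload
 *	# ethtool -K ens4np0 tso on
 *
 * The toggle lands in nfp_net_set_features(), which sets the LSO/LSO2
 * control bit and issues a firmware reconfig.
 */
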
static int nfp_net_read_caps(struct nfp_net *nn)
{
	/* Get some of the read-only fields from the BAR */
	nn->cap = nn_readl(nn, NFP_NET_CFG_CAP);
	nn->max_mtu = nn_readl(nn, NFP_NET_CFG_MAX_MTU);

	/* ABI 4.x and ctrl vNIC always use chained metadata, in other cases
	 * we allow use of non-chained metadata if RSS(v1) is the only
	 * advertised capability requiring metadata.
	 */
	nn->dp.chained_metadata_format = nn->fw_ver.major == 4 ||
					 !nn->dp.netdev ||
					 !(nn->cap & NFP_NET_CFG_CTRL_RSS) ||
					 nn->cap & NFP_NET_CFG_CTRL_CHAIN_META;
	/* RSS(v1) uses non-chained metadata format, except in ABI 4.x where
	 * it has the same meaning as RSSv2.
	 */
	if (nn->dp.chained_metadata_format && nn->fw_ver.major != 4)
		nn->cap &= ~NFP_NET_CFG_CTRL_RSS;

	/* Determine RX packet/metadata boundary offset */
	if (nn->fw_ver.major >= 2) {
		u32 reg;

		reg = nn_readl(nn, NFP_NET_CFG_RX_OFFSET);
		if (reg > NFP_NET_MAX_PREPEND) {
			nn_err(nn, "Invalid rx offset: %d\n", reg);
			return -EINVAL;
		}
		nn->dp.rx_offset = reg;
	} else {
		nn->dp.rx_offset = NFP_NET_RX_OFFSET;
	}

	/* For control vNICs mask out the capabilities app doesn't want. */
	if (!nn->dp.netdev)
		nn->cap &= nn->app->type->ctrl_cap_mask;

	return 0;
}

/**
 * nfp_net_init() - Initialise/finalise the nfp_net structure
 * @nn: NFP Net device structure
 *
 * Return: 0 on success or negative errno on error.
 */
int nfp_net_init(struct nfp_net *nn)
{
	int err;

	nn->dp.rx_dma_dir = DMA_FROM_DEVICE;

	err = nfp_net_read_caps(nn);
	if (err)
		return err;

	/* Set default MTU and Freelist buffer size */
	if (!nfp_net_is_data_vnic(nn) && nn->app->ctrl_mtu) {
		nn->dp.mtu = min(nn->app->ctrl_mtu, nn->max_mtu);
	} else if (nn->max_mtu < NFP_NET_DEFAULT_MTU) {
		nn->dp.mtu = nn->max_mtu;
	} else {
		nn->dp.mtu = NFP_NET_DEFAULT_MTU;
	}
	nn->dp.fl_bufsz = nfp_net_calc_fl_bufsz(&nn->dp);

	if (nfp_app_ctrl_uses_data_vnics(nn->app))
		nn->dp.ctrl |= nn->cap & NFP_NET_CFG_CTRL_CMSG_DATA;

	if (nn->cap & NFP_NET_CFG_CTRL_RSS_ANY) {
		nfp_net_rss_init(nn);
		nn->dp.ctrl |= nn->cap & NFP_NET_CFG_CTRL_RSS2 ?:
					 NFP_NET_CFG_CTRL_RSS;
	}

	/* Allow L2 Broadcast and Multicast through by default, if supported */
	if (nn->cap & NFP_NET_CFG_CTRL_L2BC)
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_L2BC;

	/* Allow IRQ moderation, if supported */
	if (nn->cap & NFP_NET_CFG_CTRL_IRQMOD) {
		nfp_net_irqmod_init(nn);
		nn->dp.ctrl |= NFP_NET_CFG_CTRL_IRQMOD;
	}

	/* Stash the re-configuration queue away. First odd queue in TX Bar */
	nn->qcp_cfg = nn->tx_bar + NFP_QCP_QUEUE_ADDR_SZ;

	/* Make sure the FW knows the netdev is supposed to be disabled here */
	nn_writel(nn, NFP_NET_CFG_CTRL, 0);
	nn_writeq(nn, NFP_NET_CFG_TXRS_ENABLE, 0);
	nn_writeq(nn, NFP_NET_CFG_RXRS_ENABLE, 0);
	err = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_RING |
				   NFP_NET_CFG_UPDATE_GEN);
	if (err)
		return err;

	if (nn->dp.netdev) {
		nfp_net_netdev_init(nn);

		err = nfp_ccm_mbox_init(nn);
		if (err)
			return err;

		err = nfp_net_tls_init(nn);
		if (err)
			goto err_clean_mbox;
	}

	nfp_net_vecs_init(nn);

	if (!nn->dp.netdev)
		return 0;
	return register_netdev(nn->dp.netdev);

err_clean_mbox:
	nfp_ccm_mbox_clean(nn);
	return err;
}

/**
 * nfp_net_clean() - Undo what nfp_net_init() did.
 * @nn: NFP Net device structure
 */
void nfp_net_clean(struct nfp_net *nn)
{
	if (!nn->dp.netdev)
		return;

	unregister_netdev(nn->dp.netdev);
	nfp_ccm_mbox_clean(nn);
	nfp_net_reconfig_wait_posted(nn);
}
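
/* Editor's lifecycle sketch (not driver code; error handling trimmed and the
 * surrounding probe context is a placeholder): the vNIC setup/teardown pairs
 * in this file are used as
 *
 *	nn = nfp_net_alloc(pdev, ctrl_bar, true, ntx, nrx);
 *	if (IS_ERR(nn))
 *		return PTR_ERR(nn);
 *	err = nfp_net_init(nn);		// reads caps, registers the netdev
 *	...
 *	nfp_net_clean(nn);		// unregisters the netdev
 *	nfp_net_free(nn);		// frees what nfp_net_alloc() allocated
 *
 * nfp_net_clean() must run before nfp_net_free(), which WARNs if a posted
 * reconfig is still pending.
 */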