drivers/net/ethernet/pensando/ionic/ionic_txrx.c
// SPDX-License-Identifier: GPL-2.0
/* Copyright(c) 2017 - 2019 Pensando Systems, Inc */

#include <linux/ip.h>
#include <linux/ipv6.h>
#include <linux/if_vlan.h>
#include <net/ip6_checksum.h>

#include "ionic.h"
#include "ionic_lif.h"
#include "ionic_txrx.h"

static void ionic_rx_clean(struct ionic_queue *q, struct ionic_desc_info *desc_info,
                           struct ionic_cq_info *cq_info, void *cb_arg);

static inline void ionic_txq_post(struct ionic_queue *q, bool ring_dbell,
                                  ionic_desc_cb cb_func, void *cb_arg)
{
        DEBUG_STATS_TXQ_POST(q_to_qcq(q), q->head->desc, ring_dbell);

        ionic_q_post(q, ring_dbell, cb_func, cb_arg);
}

static inline void ionic_rxq_post(struct ionic_queue *q, bool ring_dbell,
                                  ionic_desc_cb cb_func, void *cb_arg)
{
        ionic_q_post(q, ring_dbell, cb_func, cb_arg);

        DEBUG_STATS_RX_BUFF_CNT(q_to_qcq(q));
}

static inline struct netdev_queue *q_to_ndq(struct ionic_queue *q)
{
        return netdev_get_tx_queue(q->lif->netdev, q->index);
}

static struct sk_buff *ionic_rx_skb_alloc(struct ionic_queue *q,
                                          unsigned int len, bool frags)
{
        struct ionic_lif *lif = q->lif;
        struct ionic_rx_stats *stats;
        struct net_device *netdev;
        struct sk_buff *skb;

        netdev = lif->netdev;
        stats = q_to_rx_stats(q);

        if (frags)
                skb = napi_get_frags(&q_to_qcq(q)->napi);
        else
                skb = netdev_alloc_skb_ip_align(netdev, len);

        if (unlikely(!skb)) {
                net_warn_ratelimited("%s: SKB alloc failed on %s!\n",
                                     netdev->name, q->name);
                stats->alloc_err++;
                return NULL;
        }

        return skb;
}

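/* Build a frag-based skb from the pages already DMA-mapped for this
 * descriptor; each page is unmapped and attached to the skb as a frag.
 */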
static struct sk_buff *ionic_rx_frags(struct ionic_queue *q,
                                      struct ionic_desc_info *desc_info,
                                      struct ionic_cq_info *cq_info)
{
        struct ionic_rxq_comp *comp = cq_info->cq_desc;
        struct device *dev = q->lif->ionic->dev;
        struct ionic_page_info *page_info;
        struct sk_buff *skb;
        unsigned int i;
        u16 frag_len;
        u16 len;

        page_info = &desc_info->pages[0];
        len = le16_to_cpu(comp->len);

        prefetch(page_address(page_info->page) + NET_IP_ALIGN);

        skb = ionic_rx_skb_alloc(q, len, true);
        if (unlikely(!skb))
                return NULL;

        i = comp->num_sg_elems + 1;
        do {
                if (unlikely(!page_info->page)) {
                        struct napi_struct *napi = &q_to_qcq(q)->napi;

                        napi->skb = NULL;
                        dev_kfree_skb(skb);
                        return NULL;
                }

                frag_len = min(len, (u16)PAGE_SIZE);
                len -= frag_len;

                dma_unmap_page(dev, dma_unmap_addr(page_info, dma_addr),
                               PAGE_SIZE, DMA_FROM_DEVICE);
                skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags,
                                page_info->page, 0, frag_len, PAGE_SIZE);
                page_info->page = NULL;
                page_info++;
                i--;
        } while (i > 0);

        return skb;
}

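/* Small packets are copied into a freshly allocated linear skb so the
 * receive page can stay mapped and be recycled by ionic_rx_fill().
 */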
static struct sk_buff *ionic_rx_copybreak(struct ionic_queue *q,
                                          struct ionic_desc_info *desc_info,
                                          struct ionic_cq_info *cq_info)
{
        struct ionic_rxq_comp *comp = cq_info->cq_desc;
        struct device *dev = q->lif->ionic->dev;
        struct ionic_page_info *page_info;
        struct sk_buff *skb;
        u16 len;

        page_info = &desc_info->pages[0];
        len = le16_to_cpu(comp->len);

        skb = ionic_rx_skb_alloc(q, len, false);
        if (unlikely(!skb))
                return NULL;

        if (unlikely(!page_info->page)) {
                dev_kfree_skb(skb);
                return NULL;
        }

        dma_sync_single_for_cpu(dev, dma_unmap_addr(page_info, dma_addr),
                                len, DMA_FROM_DEVICE);
        skb_copy_to_linear_data(skb, page_address(page_info->page), len);
        dma_sync_single_for_device(dev, dma_unmap_addr(page_info, dma_addr),
                                   len, DMA_FROM_DEVICE);

        skb_put(skb, len);
        skb->protocol = eth_type_trans(skb, q->lif->netdev);

        return skb;
}

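/* Per-packet Rx completion handling: update stats, build the skb
 * (copybreak or frags), fill in RSS hash, checksum and VLAN info,
 * then hand the packet to GRO.
 */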
static void ionic_rx_clean(struct ionic_queue *q, struct ionic_desc_info *desc_info,
                           struct ionic_cq_info *cq_info, void *cb_arg)
{
        struct ionic_rxq_comp *comp = cq_info->cq_desc;
        struct ionic_qcq *qcq = q_to_qcq(q);
        struct ionic_rx_stats *stats;
        struct net_device *netdev;
        struct sk_buff *skb;

        stats = q_to_rx_stats(q);
        netdev = q->lif->netdev;

        if (comp->status)
                return;

        /* no packet processing while resetting */
        if (unlikely(test_bit(IONIC_LIF_QUEUE_RESET, q->lif->state)))
                return;

        stats->pkts++;
        stats->bytes += le16_to_cpu(comp->len);

        if (le16_to_cpu(comp->len) <= q->lif->rx_copybreak)
                skb = ionic_rx_copybreak(q, desc_info, cq_info);
        else
                skb = ionic_rx_frags(q, desc_info, cq_info);

        if (unlikely(!skb))
                return;

        skb_record_rx_queue(skb, q->index);

        if (likely(netdev->features & NETIF_F_RXHASH)) {
                switch (comp->pkt_type_color & IONIC_RXQ_COMP_PKT_TYPE_MASK) {
                case IONIC_PKT_TYPE_IPV4:
                case IONIC_PKT_TYPE_IPV6:
                        skb_set_hash(skb, le32_to_cpu(comp->rss_hash),
                                     PKT_HASH_TYPE_L3);
                        break;
                case IONIC_PKT_TYPE_IPV4_TCP:
                case IONIC_PKT_TYPE_IPV6_TCP:
                case IONIC_PKT_TYPE_IPV4_UDP:
                case IONIC_PKT_TYPE_IPV6_UDP:
                        skb_set_hash(skb, le32_to_cpu(comp->rss_hash),
                                     PKT_HASH_TYPE_L4);
                        break;
                }
        }

        if (likely(netdev->features & NETIF_F_RXCSUM)) {
                if (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_CALC) {
                        skb->ip_summed = CHECKSUM_COMPLETE;
                        skb->csum = (__wsum)le16_to_cpu(comp->csum);
                        stats->csum_complete++;
                }
        } else {
                stats->csum_none++;
        }

        if (unlikely((comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_TCP_BAD) ||
                     (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_UDP_BAD) ||
                     (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_IP_BAD)))
                stats->csum_error++;

        if (likely(netdev->features & NETIF_F_HW_VLAN_CTAG_RX)) {
                if (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_VLAN)
                        __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
                                               le16_to_cpu(comp->vlan_tci));
        }

        if (le16_to_cpu(comp->len) <= q->lif->rx_copybreak)
                napi_gro_receive(&qcq->napi, skb);
        else
                napi_gro_frags(&qcq->napi);
}

static bool ionic_rx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
{
        struct ionic_rxq_comp *comp = cq_info->cq_desc;
        struct ionic_queue *q = cq->bound_q;
        struct ionic_desc_info *desc_info;

        if (!color_match(comp->pkt_type_color, cq->done_color))
                return false;

        /* check for empty queue */
        if (q->tail->index == q->head->index)
                return false;

        desc_info = q->tail;
        if (desc_info->index != le16_to_cpu(comp->comp_index))
                return false;

        q->tail = desc_info->next;

        /* clean the related q entry, only one per qc completion */
        ionic_rx_clean(q, desc_info, cq_info, desc_info->cb_arg);

        desc_info->cb = NULL;
        desc_info->cb_arg = NULL;

        return true;
}

static u32 ionic_rx_walk_cq(struct ionic_cq *rxcq, u32 limit)
{
        u32 work_done = 0;

        while (ionic_rx_service(rxcq, rxcq->tail)) {
                if (rxcq->tail->last)
                        rxcq->done_color = !rxcq->done_color;
                rxcq->tail = rxcq->tail->next;
                DEBUG_STATS_CQE_CNT(rxcq);

                if (++work_done >= limit)
                        break;
        }

        return work_done;
}

void ionic_rx_flush(struct ionic_cq *cq)
{
        struct ionic_dev *idev = &cq->lif->ionic->idev;
        u32 work_done;

        work_done = ionic_rx_walk_cq(cq, cq->num_descs);

        if (work_done)
                ionic_intr_credits(idev->intr_ctrl, cq->bound_intr->index,
                                   work_done, IONIC_INTR_CRED_RESET_COALESCE);
}

static struct page *ionic_rx_page_alloc(struct ionic_queue *q,
                                        dma_addr_t *dma_addr)
{
        struct ionic_lif *lif = q->lif;
        struct ionic_rx_stats *stats;
        struct net_device *netdev;
        struct device *dev;
        struct page *page;

        netdev = lif->netdev;
        dev = lif->ionic->dev;
        stats = q_to_rx_stats(q);
        page = alloc_page(GFP_ATOMIC);
        if (unlikely(!page)) {
                net_err_ratelimited("%s: Page alloc failed on %s!\n",
                                    netdev->name, q->name);
                stats->alloc_err++;
                return NULL;
        }

        *dma_addr = dma_map_page(dev, page, 0, PAGE_SIZE, DMA_FROM_DEVICE);
        if (unlikely(dma_mapping_error(dev, *dma_addr))) {
                __free_page(page);
                net_err_ratelimited("%s: DMA single map failed on %s!\n",
                                    netdev->name, q->name);
                stats->dma_map_err++;
                return NULL;
        }

        return page;
}

static void ionic_rx_page_free(struct ionic_queue *q, struct page *page,
                               dma_addr_t dma_addr)
{
        struct ionic_lif *lif = q->lif;
        struct net_device *netdev;
        struct device *dev;

        netdev = lif->netdev;
        dev = lif->ionic->dev;

        if (unlikely(!page)) {
                net_err_ratelimited("%s: Trying to free unallocated buffer on %s!\n",
                                    netdev->name, q->name);
                return;
        }

        dma_unmap_page(dev, dma_addr, PAGE_SIZE, DMA_FROM_DEVICE);

        __free_page(page);
}

#define IONIC_RX_RING_DOORBELL_STRIDE           ((1 << 5) - 1)
#define IONIC_RX_RING_HEAD_BUF_SZ               2048

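/* Post receive buffers: one page for the main descriptor plus SG pages
 * as needed to cover the MTU, recycling any pages still attached to a
 * descriptor and batching doorbell rings per IONIC_RX_RING_DOORBELL_STRIDE.
 */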
void ionic_rx_fill(struct ionic_queue *q)
{
        struct net_device *netdev = q->lif->netdev;
        struct ionic_desc_info *desc_info;
        struct ionic_page_info *page_info;
        struct ionic_rxq_sg_desc *sg_desc;
        struct ionic_rxq_sg_elem *sg_elem;
        struct ionic_rxq_desc *desc;
        unsigned int nfrags;
        bool ring_doorbell;
        unsigned int i, j;
        unsigned int len;

        len = netdev->mtu + ETH_HLEN;
        nfrags = round_up(len, PAGE_SIZE) / PAGE_SIZE;

        for (i = ionic_q_space_avail(q); i; i--) {
                desc_info = q->head;
                desc = desc_info->desc;
                sg_desc = desc_info->sg_desc;
                page_info = &desc_info->pages[0];

                if (page_info->page) { /* recycle the buffer */
                        ring_doorbell = ((q->head->index + 1) &
                                        IONIC_RX_RING_DOORBELL_STRIDE) == 0;
                        ionic_rxq_post(q, ring_doorbell, ionic_rx_clean, NULL);
                        continue;
                }

                /* fill main descriptor - pages[0] */
                desc->opcode = (nfrags > 1) ? IONIC_RXQ_DESC_OPCODE_SG :
                                              IONIC_RXQ_DESC_OPCODE_SIMPLE;
                desc_info->npages = nfrags;
                page_info->page = ionic_rx_page_alloc(q, &page_info->dma_addr);
                if (unlikely(!page_info->page)) {
                        desc->addr = 0;
                        desc->len = 0;
                        return;
                }
                desc->addr = cpu_to_le64(page_info->dma_addr);
                desc->len = cpu_to_le16(PAGE_SIZE);
                page_info++;

                /* fill sg descriptors - pages[1..n] */
                for (j = 0; j < nfrags - 1; j++) {
                        if (page_info->page) /* recycle the sg buffer */
                                continue;

                        sg_elem = &sg_desc->elems[j];
                        page_info->page = ionic_rx_page_alloc(q, &page_info->dma_addr);
                        if (unlikely(!page_info->page)) {
                                sg_elem->addr = 0;
                                sg_elem->len = 0;
                                return;
                        }
                        sg_elem->addr = cpu_to_le64(page_info->dma_addr);
                        sg_elem->len = cpu_to_le16(PAGE_SIZE);
                        page_info++;
                }

                ring_doorbell = ((q->head->index + 1) &
                                IONIC_RX_RING_DOORBELL_STRIDE) == 0;
                ionic_rxq_post(q, ring_doorbell, ionic_rx_clean, NULL);
        }
}

static void ionic_rx_fill_cb(void *arg)
{
        ionic_rx_fill(arg);
}

void ionic_rx_empty(struct ionic_queue *q)
{
        struct ionic_desc_info *cur;
        struct ionic_rxq_desc *desc;
        unsigned int i;

        for (cur = q->tail; cur != q->head; cur = cur->next) {
                desc = cur->desc;
                desc->addr = 0;
                desc->len = 0;

                for (i = 0; i < cur->npages; i++) {
                        if (likely(cur->pages[i].page)) {
                                ionic_rx_page_free(q, cur->pages[i].page,
                                                   cur->pages[i].dma_addr);
                                cur->pages[i].page = NULL;
                                cur->pages[i].dma_addr = 0;
                        }
                }

                cur->cb_arg = NULL;
        }
}

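/* NAPI poll: flush Tx completions for the paired txq, service up to
 * budget Rx completions, refill the ring, and re-arm the interrupt
 * once the budget is not exhausted.
 */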
int ionic_rx_napi(struct napi_struct *napi, int budget)
{
        struct ionic_qcq *qcq = napi_to_qcq(napi);
        struct ionic_cq *rxcq = napi_to_cq(napi);
        unsigned int qi = rxcq->bound_q->index;
        struct ionic_dev *idev;
        struct ionic_lif *lif;
        struct ionic_cq *txcq;
        u32 work_done = 0;
        u32 flags = 0;

        lif = rxcq->bound_q->lif;
        idev = &lif->ionic->idev;
        txcq = &lif->txqcqs[qi].qcq->cq;

        ionic_tx_flush(txcq);

        work_done = ionic_rx_walk_cq(rxcq, budget);

        if (work_done)
                ionic_rx_fill_cb(rxcq->bound_q);

        if (work_done < budget && napi_complete_done(napi, work_done)) {
                flags |= IONIC_INTR_CRED_UNMASK;
                DEBUG_STATS_INTR_REARM(rxcq->bound_intr);
        }

        if (work_done || flags) {
                flags |= IONIC_INTR_CRED_RESET_COALESCE;
                ionic_intr_credits(idev->intr_ctrl, rxcq->bound_intr->index,
                                   work_done, flags);
        }

        DEBUG_STATS_NAPI_POLL(qcq, work_done);

        return work_done;
}

static dma_addr_t ionic_tx_map_single(struct ionic_queue *q, void *data, size_t len)
{
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        struct device *dev = q->lif->ionic->dev;
        dma_addr_t dma_addr;

        dma_addr = dma_map_single(dev, data, len, DMA_TO_DEVICE);
        if (dma_mapping_error(dev, dma_addr)) {
                net_warn_ratelimited("%s: DMA single map failed on %s!\n",
                                     q->lif->netdev->name, q->name);
                stats->dma_map_err++;
                return 0;
        }
        return dma_addr;
}

static dma_addr_t ionic_tx_map_frag(struct ionic_queue *q, const skb_frag_t *frag,
                                    size_t offset, size_t len)
{
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        struct device *dev = q->lif->ionic->dev;
        dma_addr_t dma_addr;

        dma_addr = skb_frag_dma_map(dev, frag, offset, len, DMA_TO_DEVICE);
        if (dma_mapping_error(dev, dma_addr)) {
                net_warn_ratelimited("%s: DMA frag map failed on %s!\n",
                                     q->lif->netdev->name, q->name);
                stats->dma_map_err++;
        }
        return dma_addr;
}

static void ionic_tx_clean(struct ionic_queue *q, struct ionic_desc_info *desc_info,
                           struct ionic_cq_info *cq_info, void *cb_arg)
{
        struct ionic_txq_sg_desc *sg_desc = desc_info->sg_desc;
        struct ionic_txq_sg_elem *elem = sg_desc->elems;
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        struct ionic_txq_desc *desc = desc_info->desc;
        struct device *dev = q->lif->ionic->dev;
        u8 opcode, flags, nsge;
        u16 queue_index;
        unsigned int i;
        u64 addr;

        decode_txq_desc_cmd(le64_to_cpu(desc->cmd),
                            &opcode, &flags, &nsge, &addr);

        /* use unmap_single only if either this is not TSO,
         * or this is the first descriptor of a TSO
         */
        if (opcode != IONIC_TXQ_DESC_OPCODE_TSO ||
            flags & IONIC_TXQ_DESC_FLAG_TSO_SOT)
                dma_unmap_single(dev, (dma_addr_t)addr,
                                 le16_to_cpu(desc->len), DMA_TO_DEVICE);
        else
                dma_unmap_page(dev, (dma_addr_t)addr,
                               le16_to_cpu(desc->len), DMA_TO_DEVICE);

        for (i = 0; i < nsge; i++, elem++)
                dma_unmap_page(dev, (dma_addr_t)le64_to_cpu(elem->addr),
                               le16_to_cpu(elem->len), DMA_TO_DEVICE);

        if (cb_arg) {
                struct sk_buff *skb = cb_arg;
                u32 len = skb->len;

                queue_index = skb_get_queue_mapping(skb);
                if (unlikely(__netif_subqueue_stopped(q->lif->netdev,
                                                      queue_index))) {
                        netif_wake_subqueue(q->lif->netdev, queue_index);
                        q->wake++;
                }
                dev_kfree_skb_any(skb);
                stats->clean++;
                netdev_tx_completed_queue(q_to_ndq(q), 1, len);
        }
}

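/* Service Tx completions: each completion may cover several queue
 * entries, all cleaned here, then return the credits to the interrupt
 * control block.
 */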
void ionic_tx_flush(struct ionic_cq *cq)
{
        struct ionic_txq_comp *comp = cq->tail->cq_desc;
        struct ionic_dev *idev = &cq->lif->ionic->idev;
        struct ionic_queue *q = cq->bound_q;
        struct ionic_desc_info *desc_info;
        unsigned int work_done = 0;

        /* walk the completed cq entries */
        while (work_done < cq->num_descs &&
               color_match(comp->color, cq->done_color)) {

                /* clean the related q entries, there could be
                 * several q entries completed for each cq completion
                 */
                do {
                        desc_info = q->tail;
                        q->tail = desc_info->next;
                        ionic_tx_clean(q, desc_info, cq->tail,
                                       desc_info->cb_arg);
                        desc_info->cb = NULL;
                        desc_info->cb_arg = NULL;
                } while (desc_info->index != le16_to_cpu(comp->comp_index));

                if (cq->tail->last)
                        cq->done_color = !cq->done_color;

                cq->tail = cq->tail->next;
                comp = cq->tail->cq_desc;
                DEBUG_STATS_CQE_CNT(cq);

                work_done++;
        }

        if (work_done)
                ionic_intr_credits(idev->intr_ctrl, cq->bound_intr->index,
                                   work_done, 0);
}

static int ionic_tx_tcp_inner_pseudo_csum(struct sk_buff *skb)
{
        int err;

        err = skb_cow_head(skb, 0);
        if (err)
                return err;

        if (skb->protocol == cpu_to_be16(ETH_P_IP)) {
                inner_ip_hdr(skb)->check = 0;
                inner_tcp_hdr(skb)->check =
                        ~csum_tcpudp_magic(inner_ip_hdr(skb)->saddr,
                                           inner_ip_hdr(skb)->daddr,
                                           0, IPPROTO_TCP, 0);
        } else if (skb->protocol == cpu_to_be16(ETH_P_IPV6)) {
                inner_tcp_hdr(skb)->check =
                        ~csum_ipv6_magic(&inner_ipv6_hdr(skb)->saddr,
                                         &inner_ipv6_hdr(skb)->daddr,
                                         0, IPPROTO_TCP, 0);
        }

        return 0;
}

static int ionic_tx_tcp_pseudo_csum(struct sk_buff *skb)
{
        int err;

        err = skb_cow_head(skb, 0);
        if (err)
                return err;

        if (skb->protocol == cpu_to_be16(ETH_P_IP)) {
                ip_hdr(skb)->check = 0;
                tcp_hdr(skb)->check =
                        ~csum_tcpudp_magic(ip_hdr(skb)->saddr,
                                           ip_hdr(skb)->daddr,
                                           0, IPPROTO_TCP, 0);
        } else if (skb->protocol == cpu_to_be16(ETH_P_IPV6)) {
                tcp_hdr(skb)->check =
                        ~csum_ipv6_magic(&ipv6_hdr(skb)->saddr,
                                         &ipv6_hdr(skb)->daddr,
                                         0, IPPROTO_TCP, 0);
        }

        return 0;
}

static void ionic_tx_tso_post(struct ionic_queue *q, struct ionic_txq_desc *desc,
                              struct sk_buff *skb,
                              dma_addr_t addr, u8 nsge, u16 len,
                              unsigned int hdrlen, unsigned int mss,
                              bool outer_csum,
                              u16 vlan_tci, bool has_vlan,
                              bool start, bool done)
{
        u8 flags = 0;
        u64 cmd;

        flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
        flags |= outer_csum ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;
        flags |= start ? IONIC_TXQ_DESC_FLAG_TSO_SOT : 0;
        flags |= done ? IONIC_TXQ_DESC_FLAG_TSO_EOT : 0;

        cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_TSO, flags, nsge, addr);
        desc->cmd = cpu_to_le64(cmd);
        desc->len = cpu_to_le16(len);
        desc->vlan_tci = cpu_to_le16(vlan_tci);
        desc->hdr_len = cpu_to_le16(hdrlen);
        desc->mss = cpu_to_le16(mss);

        if (done) {
                skb_tx_timestamp(skb);
                netdev_tx_sent_queue(q_to_ndq(q), skb->len);
                ionic_txq_post(q, !netdev_xmit_more(), ionic_tx_clean, skb);
        } else {
                ionic_txq_post(q, false, ionic_tx_clean, NULL);
        }
}

static struct ionic_txq_desc *ionic_tx_tso_next(struct ionic_queue *q,
                                                struct ionic_txq_sg_elem **elem)
{
        struct ionic_txq_sg_desc *sg_desc = q->head->sg_desc;
        struct ionic_txq_desc *desc = q->head->desc;

        *elem = sg_desc->elems;
        return desc;
}

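/* Segment a GSO skb into TSO descriptors: the linear data and then each
 * frag are chopped into mss-sized pieces, with the first and last
 * descriptors flagged as start/end of the TSO.
 */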
static int ionic_tx_tso(struct ionic_queue *q, struct sk_buff *skb)
{
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        struct ionic_desc_info *abort = q->head;
        struct device *dev = q->lif->ionic->dev;
        struct ionic_desc_info *rewind = abort;
        struct ionic_txq_sg_elem *elem;
        struct ionic_txq_desc *desc;
        unsigned int frag_left = 0;
        unsigned int offset = 0;
        unsigned int len_left;
        dma_addr_t desc_addr;
        unsigned int hdrlen;
        unsigned int nfrags;
        unsigned int seglen;
        u64 total_bytes = 0;
        u64 total_pkts = 0;
        unsigned int left;
        unsigned int len;
        unsigned int mss;
        skb_frag_t *frag;
        bool start, done;
        bool outer_csum;
        bool has_vlan;
        u16 desc_len;
        u8 desc_nsge;
        u16 vlan_tci;
        bool encap;
        int err;

        mss = skb_shinfo(skb)->gso_size;
        nfrags = skb_shinfo(skb)->nr_frags;
        len_left = skb->len - skb_headlen(skb);
        outer_csum = (skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM) ||
                     (skb_shinfo(skb)->gso_type & SKB_GSO_UDP_TUNNEL_CSUM);
        has_vlan = !!skb_vlan_tag_present(skb);
        vlan_tci = skb_vlan_tag_get(skb);
        encap = skb->encapsulation;

        /* Preload inner-most TCP csum field with IP pseudo hdr
         * calculated with IP length set to zero.  HW will later
         * add in length to each TCP segment resulting from the TSO.
         */

        if (encap)
                err = ionic_tx_tcp_inner_pseudo_csum(skb);
        else
                err = ionic_tx_tcp_pseudo_csum(skb);
        if (err)
                return err;

        if (encap)
                hdrlen = skb_inner_transport_header(skb) - skb->data +
                         inner_tcp_hdrlen(skb);
        else
                hdrlen = skb_transport_offset(skb) + tcp_hdrlen(skb);

        seglen = hdrlen + mss;
        left = skb_headlen(skb);

        desc = ionic_tx_tso_next(q, &elem);
        start = true;

        /* Chop skb->data up into desc segments */

        while (left > 0) {
                len = min(seglen, left);
                frag_left = seglen - len;
                desc_addr = ionic_tx_map_single(q, skb->data + offset, len);
                if (dma_mapping_error(dev, desc_addr))
                        goto err_out_abort;
                desc_len = len;
                desc_nsge = 0;
                left -= len;
                offset += len;
                if (nfrags > 0 && frag_left > 0)
                        continue;
                done = (nfrags == 0 && left == 0);
                ionic_tx_tso_post(q, desc, skb,
                                  desc_addr, desc_nsge, desc_len,
                                  hdrlen, mss,
                                  outer_csum,
                                  vlan_tci, has_vlan,
                                  start, done);
                total_pkts++;
                total_bytes += start ? len : len + hdrlen;
                desc = ionic_tx_tso_next(q, &elem);
                start = false;
                seglen = mss;
        }

        /* Chop skb frags into desc segments */

        for (frag = skb_shinfo(skb)->frags; len_left; frag++) {
                offset = 0;
                left = skb_frag_size(frag);
                len_left -= left;
                nfrags--;
                stats->frags++;

                while (left > 0) {
                        if (frag_left > 0) {
                                len = min(frag_left, left);
                                frag_left -= len;
                                elem->addr =
                                    cpu_to_le64(ionic_tx_map_frag(q, frag,
                                                                  offset, len));
                                if (dma_mapping_error(dev, elem->addr))
                                        goto err_out_abort;
                                elem->len = cpu_to_le16(len);
                                elem++;
                                desc_nsge++;
                                left -= len;
                                offset += len;
                                if (nfrags > 0 && frag_left > 0)
                                        continue;
                                done = (nfrags == 0 && left == 0);
                                ionic_tx_tso_post(q, desc, skb, desc_addr,
                                                  desc_nsge, desc_len,
                                                  hdrlen, mss, outer_csum,
                                                  vlan_tci, has_vlan,
                                                  start, done);
                                total_pkts++;
                                total_bytes += start ? len : len + hdrlen;
                                desc = ionic_tx_tso_next(q, &elem);
                                start = false;
                        } else {
                                len = min(mss, left);
                                frag_left = mss - len;
                                desc_addr = ionic_tx_map_frag(q, frag,
                                                              offset, len);
                                if (dma_mapping_error(dev, desc_addr))
                                        goto err_out_abort;
                                desc_len = len;
                                desc_nsge = 0;
                                left -= len;
                                offset += len;
                                if (nfrags > 0 && frag_left > 0)
                                        continue;
                                done = (nfrags == 0 && left == 0);
                                ionic_tx_tso_post(q, desc, skb, desc_addr,
                                                  desc_nsge, desc_len,
                                                  hdrlen, mss, outer_csum,
                                                  vlan_tci, has_vlan,
                                                  start, done);
                                total_pkts++;
                                total_bytes += start ? len : len + hdrlen;
                                desc = ionic_tx_tso_next(q, &elem);
                                start = false;
                        }
                }
        }

        stats->pkts += total_pkts;
        stats->bytes += total_bytes;
        stats->tso++;

        return 0;

err_out_abort:
        while (rewind->desc != q->head->desc) {
                ionic_tx_clean(q, rewind, NULL, NULL);
                rewind = rewind->next;
        }
        q->head = abort;

        return -ENOMEM;
}

static int ionic_tx_calc_csum(struct ionic_queue *q, struct sk_buff *skb)
{
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        struct ionic_txq_desc *desc = q->head->desc;
        struct device *dev = q->lif->ionic->dev;
        dma_addr_t dma_addr;
        bool has_vlan;
        u8 flags = 0;
        bool encap;
        u64 cmd;

        has_vlan = !!skb_vlan_tag_present(skb);
        encap = skb->encapsulation;

        dma_addr = ionic_tx_map_single(q, skb->data, skb_headlen(skb));
        if (dma_mapping_error(dev, dma_addr))
                return -ENOMEM;

        flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
        flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;

        cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_CSUM_PARTIAL,
                                  flags, skb_shinfo(skb)->nr_frags, dma_addr);
        desc->cmd = cpu_to_le64(cmd);
        desc->len = cpu_to_le16(skb_headlen(skb));
        desc->vlan_tci = cpu_to_le16(skb_vlan_tag_get(skb));
        desc->csum_start = cpu_to_le16(skb_checksum_start_offset(skb));
        desc->csum_offset = cpu_to_le16(skb->csum_offset);

        if (skb->csum_not_inet)
                stats->crc32_csum++;
        else
                stats->csum++;

        return 0;
}

static int ionic_tx_calc_no_csum(struct ionic_queue *q, struct sk_buff *skb)
{
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        struct ionic_txq_desc *desc = q->head->desc;
        struct device *dev = q->lif->ionic->dev;
        dma_addr_t dma_addr;
        bool has_vlan;
        u8 flags = 0;
        bool encap;
        u64 cmd;

        has_vlan = !!skb_vlan_tag_present(skb);
        encap = skb->encapsulation;

        dma_addr = ionic_tx_map_single(q, skb->data, skb_headlen(skb));
        if (dma_mapping_error(dev, dma_addr))
                return -ENOMEM;

        flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
        flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;

        cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_CSUM_NONE,
                                  flags, skb_shinfo(skb)->nr_frags, dma_addr);
        desc->cmd = cpu_to_le64(cmd);
        desc->len = cpu_to_le16(skb_headlen(skb));
        desc->vlan_tci = cpu_to_le16(skb_vlan_tag_get(skb));

        stats->no_csum++;

        return 0;
}

static int ionic_tx_skb_frags(struct ionic_queue *q, struct sk_buff *skb)
{
        struct ionic_txq_sg_desc *sg_desc = q->head->sg_desc;
        unsigned int len_left = skb->len - skb_headlen(skb);
        struct ionic_txq_sg_elem *elem = sg_desc->elems;
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        struct device *dev = q->lif->ionic->dev;
        dma_addr_t dma_addr;
        skb_frag_t *frag;
        u16 len;

        for (frag = skb_shinfo(skb)->frags; len_left; frag++, elem++) {
                len = skb_frag_size(frag);
                elem->len = cpu_to_le16(len);
                dma_addr = ionic_tx_map_frag(q, frag, 0, len);
                if (dma_mapping_error(dev, dma_addr))
                        return -ENOMEM;
                elem->addr = cpu_to_le64(dma_addr);
                len_left -= len;
                stats->frags++;
        }

        return 0;
}

static int ionic_tx(struct ionic_queue *q, struct sk_buff *skb)
{
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        int err;

        /* set up the initial descriptor */
        if (skb->ip_summed == CHECKSUM_PARTIAL)
                err = ionic_tx_calc_csum(q, skb);
        else
                err = ionic_tx_calc_no_csum(q, skb);
        if (err)
                return err;

        /* add frags */
        err = ionic_tx_skb_frags(q, skb);
        if (err)
                return err;

        skb_tx_timestamp(skb);
        stats->pkts++;
        stats->bytes += skb->len;

        netdev_tx_sent_queue(q_to_ndq(q), skb->len);
        ionic_txq_post(q, !netdev_xmit_more(), ionic_tx_clean, skb);

        return 0;
}

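/* Estimate how many descriptors the skb needs, linearizing it if it has
 * more frags than one descriptor's SG list can hold.
 */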
static int ionic_tx_descs_needed(struct ionic_queue *q, struct sk_buff *skb)
{
        struct ionic_tx_stats *stats = q_to_tx_stats(q);
        int err;

        /* If TSO, need roundup(skb->len/mss) descs */
        if (skb_is_gso(skb))
                return (skb->len / skb_shinfo(skb)->gso_size) + 1;

        /* If non-TSO, just need 1 desc and nr_frags sg elems */
        if (skb_shinfo(skb)->nr_frags <= IONIC_TX_MAX_SG_ELEMS)
                return 1;

        /* Too many frags, so linearize */
        err = skb_linearize(skb);
        if (err)
                return err;

        stats->linearize++;

        /* Need 1 desc and zero sg elems */
        return 1;
}

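/* Stop the subqueue if there isn't room for ndescs descriptors,
 * rechecking after the stop to close the race with ionic_tx_clean().
 */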
static int ionic_maybe_stop_tx(struct ionic_queue *q, int ndescs)
{
        int stopped = 0;

        if (unlikely(!ionic_q_has_space(q, ndescs))) {
                netif_stop_subqueue(q->lif->netdev, q->index);
                q->stop++;
                stopped = 1;

                /* Might race with ionic_tx_clean, check again */
                smp_rmb();
                if (ionic_q_has_space(q, ndescs)) {
                        netif_wake_subqueue(q->lif->netdev, q->index);
                        stopped = 0;
                }
        }

        return stopped;
}

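/* ndo_start_xmit handler: pick the Tx queue, make sure there is
 * descriptor space, then post the skb as either a TSO or a single
 * checksum/no-checksum descriptor plus SG frags.
 */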
netdev_tx_t ionic_start_xmit(struct sk_buff *skb, struct net_device *netdev)
{
        u16 queue_index = skb_get_queue_mapping(skb);
        struct ionic_lif *lif = netdev_priv(netdev);
        struct ionic_queue *q;
        int ndescs;
        int err;

        if (unlikely(!test_bit(IONIC_LIF_UP, lif->state))) {
                dev_kfree_skb(skb);
                return NETDEV_TX_OK;
        }

        if (unlikely(!lif_to_txqcq(lif, queue_index)))
                queue_index = 0;
        q = lif_to_txq(lif, queue_index);

        ndescs = ionic_tx_descs_needed(q, skb);
        if (ndescs < 0)
                goto err_out_drop;

        if (unlikely(ionic_maybe_stop_tx(q, ndescs)))
                return NETDEV_TX_BUSY;

        if (skb_is_gso(skb))
                err = ionic_tx_tso(q, skb);
        else
                err = ionic_tx(q, skb);

        if (err)
                goto err_out_drop;

        /* Stop the queue if there aren't descriptors for the next packet.
         * Since our SG lists per descriptor take care of most of the possible
         * fragmentation, we don't need to have many descriptors available.
         */
        ionic_maybe_stop_tx(q, 4);

        return NETDEV_TX_OK;

err_out_drop:
        q->stop++;
        q->drop++;
        dev_kfree_skb(skb);
        return NETDEV_TX_OK;
}