xen-netback: handle IPv6 TCP GSO packets from the guest
[linux-2.6-block.git] / drivers / net / xen-netback / netback.c
CommitLineData
f942dc25
IC
1/*
2 * Back-end of the driver for virtual network devices. This portion of the
3 * driver exports a 'unified' network-device interface that can be accessed
4 * by any operating system that implements a compatible front end. A
5 * reference front-end implementation can be found in:
6 * drivers/net/xen-netfront.c
7 *
8 * Copyright (c) 2002-2005, K A Fraser
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License version 2
12 * as published by the Free Software Foundation; or, when distributed
13 * separately from the Linux kernel or incorporated into other
14 * software packages, subject to the following license:
15 *
16 * Permission is hereby granted, free of charge, to any person obtaining a copy
17 * of this source file (the "Software"), to deal in the Software without
18 * restriction, including without limitation the rights to use, copy, modify,
19 * merge, publish, distribute, sublicense, and/or sell copies of the Software,
20 * and to permit persons to whom the Software is furnished to do so, subject to
21 * the following conditions:
22 *
23 * The above copyright notice and this permission notice shall be included in
24 * all copies or substantial portions of the Software.
25 *
26 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
27 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
28 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
29 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
30 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
31 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
32 * IN THE SOFTWARE.
33 */
34
35#include "common.h"
36
37#include <linux/kthread.h>
38#include <linux/if_vlan.h>
39#include <linux/udp.h>
40
41#include <net/tcp.h>
42
ca981633 43#include <xen/xen.h>
f942dc25
IC
44#include <xen/events.h>
45#include <xen/interface/memory.h>
46
47#include <asm/xen/hypercall.h>
48#include <asm/xen/page.h>
49
e1f00a69
WL
50/* Provide an option to disable split event channels at load time as
51 * event channels are limited resource. Split event channels are
52 * enabled by default.
53 */
54bool separate_tx_rx_irq = 1;
55module_param(separate_tx_rx_irq, bool, 0644);
56
2810e5b9
WL
57/*
58 * This is the maximum slots a skb can have. If a guest sends a skb
59 * which exceeds this limit it is considered malicious.
60 */
37641494
WL
61#define FATAL_SKB_SLOTS_DEFAULT 20
62static unsigned int fatal_skb_slots = FATAL_SKB_SLOTS_DEFAULT;
63module_param(fatal_skb_slots, uint, 0444);
64
65/*
66 * To avoid confusion, we define XEN_NETBK_LEGACY_SLOTS_MAX indicating
67 * the maximum slots a valid packet can use. Now this value is defined
68 * to be XEN_NETIF_NR_SLOTS_MIN, which is supposed to be supported by
69 * all backend.
70 */
71#define XEN_NETBK_LEGACY_SLOTS_MAX XEN_NETIF_NR_SLOTS_MIN
2810e5b9 72
2810e5b9
WL
73/*
74 * If head != INVALID_PENDING_RING_IDX, it means this tx request is head of
75 * one or more merged tx requests, otherwise it is the continuation of
76 * previous tx request.
77 */
b3f980bd 78static inline int pending_tx_is_head(struct xenvif *vif, RING_IDX idx)
f942dc25 79{
b3f980bd 80 return vif->pending_tx_info[idx].head != INVALID_PENDING_RING_IDX;
f942dc25
IC
81}
82
7376419a
WL
83static void xenvif_idx_release(struct xenvif *vif, u16 pending_idx,
84 u8 status);
85
f942dc25
IC
86static void make_tx_response(struct xenvif *vif,
87 struct xen_netif_tx_request *txp,
88 s8 st);
b3f980bd
WL
89
90static inline int tx_work_todo(struct xenvif *vif);
91static inline int rx_work_todo(struct xenvif *vif);
92
f942dc25
IC
93static struct xen_netif_rx_response *make_rx_response(struct xenvif *vif,
94 u16 id,
95 s8 st,
96 u16 offset,
97 u16 size,
98 u16 flags);
99
b3f980bd 100static inline unsigned long idx_to_pfn(struct xenvif *vif,
ea066ad1 101 u16 idx)
f942dc25 102{
b3f980bd 103 return page_to_pfn(vif->mmap_pages[idx]);
f942dc25
IC
104}
105
b3f980bd 106static inline unsigned long idx_to_kaddr(struct xenvif *vif,
ea066ad1 107 u16 idx)
f942dc25 108{
b3f980bd 109 return (unsigned long)pfn_to_kaddr(idx_to_pfn(vif, idx));
f942dc25
IC
110}
111
2eba61d5
PD
112/* This is a miniumum size for the linear area to avoid lots of
113 * calls to __pskb_pull_tail() as we set up checksum offsets. The
114 * value 128 was chosen as it covers all IPv4 and most likely
115 * IPv6 headers.
f942dc25 116 */
2eba61d5 117#define PKT_PROT_LEN 128
f942dc25 118
ea066ad1
IC
119static u16 frag_get_pending_idx(skb_frag_t *frag)
120{
121 return (u16)frag->page_offset;
122}
123
124static void frag_set_pending_idx(skb_frag_t *frag, u16 pending_idx)
125{
126 frag->page_offset = pending_idx;
127}
128
f942dc25
IC
129static inline pending_ring_idx_t pending_index(unsigned i)
130{
131 return i & (MAX_PENDING_REQS-1);
132}
133
b3f980bd 134static inline pending_ring_idx_t nr_pending_reqs(struct xenvif *vif)
f942dc25
IC
135{
136 return MAX_PENDING_REQS -
b3f980bd 137 vif->pending_prod + vif->pending_cons;
f942dc25
IC
138}
139
140static int max_required_rx_slots(struct xenvif *vif)
141{
142 int max = DIV_ROUND_UP(vif->dev->mtu, PAGE_SIZE);
143
2810e5b9 144 /* XXX FIXME: RX path dependent on MAX_SKB_FRAGS */
f942dc25
IC
145 if (vif->can_sg || vif->gso || vif->gso_prefix)
146 max += MAX_SKB_FRAGS + 1; /* extra_info + frags */
147
148 return max;
149}
150
7376419a 151int xenvif_rx_ring_full(struct xenvif *vif)
f942dc25
IC
152{
153 RING_IDX peek = vif->rx_req_cons_peek;
154 RING_IDX needed = max_required_rx_slots(vif);
155
156 return ((vif->rx.sring->req_prod - peek) < needed) ||
157 ((vif->rx.rsp_prod_pvt + XEN_NETIF_RX_RING_SIZE - peek) < needed);
158}
159
7376419a 160int xenvif_must_stop_queue(struct xenvif *vif)
f942dc25 161{
7376419a 162 if (!xenvif_rx_ring_full(vif))
f942dc25
IC
163 return 0;
164
165 vif->rx.sring->req_event = vif->rx_req_cons_peek +
166 max_required_rx_slots(vif);
167 mb(); /* request notification /then/ check the queue */
168
7376419a 169 return xenvif_rx_ring_full(vif);
f942dc25
IC
170}
171
172/*
173 * Returns true if we should start a new receive buffer instead of
174 * adding 'size' bytes to a buffer which currently contains 'offset'
175 * bytes.
176 */
177static bool start_new_rx_buffer(int offset, unsigned long size, int head)
178{
179 /* simple case: we have completely filled the current buffer. */
180 if (offset == MAX_BUFFER_OFFSET)
181 return true;
182
183 /*
184 * complex case: start a fresh buffer if the current frag
185 * would overflow the current buffer but only if:
186 * (i) this frag would fit completely in the next buffer
187 * and (ii) there is already some data in the current buffer
188 * and (iii) this is not the head buffer.
189 *
190 * Where:
191 * - (i) stops us splitting a frag into two copies
192 * unless the frag is too large for a single buffer.
193 * - (ii) stops us from leaving a buffer pointlessly empty.
194 * - (iii) stops us leaving the first buffer
195 * empty. Strictly speaking this is already covered
196 * by (ii) but is explicitly checked because
197 * netfront relies on the first buffer being
198 * non-empty and can crash otherwise.
199 *
200 * This means we will effectively linearise small
201 * frags but do not needlessly split large buffers
202 * into multiple copies tend to give large frags their
203 * own buffers as before.
204 */
205 if ((offset + size > MAX_BUFFER_OFFSET) &&
206 (size <= MAX_BUFFER_OFFSET) && offset && !head)
207 return true;
208
209 return false;
210}
211
33bc801d
WL
212struct xenvif_count_slot_state {
213 unsigned long copy_off;
214 bool head;
215};
216
217unsigned int xenvif_count_frag_slots(struct xenvif *vif,
218 unsigned long offset, unsigned long size,
219 struct xenvif_count_slot_state *state)
220{
221 unsigned count = 0;
222
223 offset &= ~PAGE_MASK;
224
225 while (size > 0) {
226 unsigned long bytes;
227
228 bytes = PAGE_SIZE - offset;
229
230 if (bytes > size)
231 bytes = size;
232
233 if (start_new_rx_buffer(state->copy_off, bytes, state->head)) {
234 count++;
235 state->copy_off = 0;
236 }
237
238 if (state->copy_off + bytes > MAX_BUFFER_OFFSET)
239 bytes = MAX_BUFFER_OFFSET - state->copy_off;
240
241 state->copy_off += bytes;
242
243 offset += bytes;
244 size -= bytes;
245
246 if (offset == PAGE_SIZE)
247 offset = 0;
248
249 state->head = false;
250 }
251
252 return count;
253}
254
f942dc25
IC
255/*
256 * Figure out how many ring slots we're going to need to send @skb to
257 * the guest. This function is essentially a dry run of
7376419a 258 * xenvif_gop_frag_copy.
f942dc25 259 */
7376419a 260unsigned int xenvif_count_skb_slots(struct xenvif *vif, struct sk_buff *skb)
f942dc25 261{
33bc801d 262 struct xenvif_count_slot_state state;
f942dc25 263 unsigned int count;
33bc801d
WL
264 unsigned char *data;
265 unsigned i;
f942dc25 266
33bc801d
WL
267 state.head = true;
268 state.copy_off = 0;
f942dc25 269
33bc801d
WL
270 /* Slot for the first (partial) page of data. */
271 count = 1;
f942dc25 272
33bc801d 273 /* Need a slot for the GSO prefix for GSO extra data? */
f942dc25
IC
274 if (skb_shinfo(skb)->gso_size)
275 count++;
276
33bc801d
WL
277 data = skb->data;
278 while (data < skb_tail_pointer(skb)) {
279 unsigned long offset = offset_in_page(data);
280 unsigned long size = PAGE_SIZE - offset;
4f0581d2 281
33bc801d
WL
282 if (data + size > skb_tail_pointer(skb))
283 size = skb_tail_pointer(skb) - data;
6a8ed462 284
33bc801d 285 count += xenvif_count_frag_slots(vif, offset, size, &state);
4f0581d2 286
33bc801d
WL
287 data += size;
288 }
4f0581d2 289
33bc801d
WL
290 for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
291 unsigned long size = skb_frag_size(&skb_shinfo(skb)->frags[i]);
292 unsigned long offset = skb_shinfo(skb)->frags[i].page_offset;
4f0581d2 293
33bc801d 294 count += xenvif_count_frag_slots(vif, offset, size, &state);
f942dc25
IC
295 }
296 return count;
297}
298
299struct netrx_pending_operations {
300 unsigned copy_prod, copy_cons;
301 unsigned meta_prod, meta_cons;
302 struct gnttab_copy *copy;
b3f980bd 303 struct xenvif_rx_meta *meta;
f942dc25
IC
304 int copy_off;
305 grant_ref_t copy_gref;
306};
307
b3f980bd
WL
308static struct xenvif_rx_meta *get_next_rx_buffer(struct xenvif *vif,
309 struct netrx_pending_operations *npo)
f942dc25 310{
b3f980bd 311 struct xenvif_rx_meta *meta;
f942dc25
IC
312 struct xen_netif_rx_request *req;
313
314 req = RING_GET_REQUEST(&vif->rx, vif->rx.req_cons++);
315
316 meta = npo->meta + npo->meta_prod++;
317 meta->gso_size = 0;
318 meta->size = 0;
319 meta->id = req->id;
320
321 npo->copy_off = 0;
322 npo->copy_gref = req->gref;
323
324 return meta;
325}
326
33bc801d
WL
327/*
328 * Set up the grant operations for this fragment. If it's a flipping
329 * interface, we also set up the unmap request from here.
330 */
7376419a
WL
331static void xenvif_gop_frag_copy(struct xenvif *vif, struct sk_buff *skb,
332 struct netrx_pending_operations *npo,
333 struct page *page, unsigned long size,
33bc801d 334 unsigned long offset, int *head)
f942dc25
IC
335{
336 struct gnttab_copy *copy_gop;
b3f980bd 337 struct xenvif_rx_meta *meta;
f942dc25
IC
338 unsigned long bytes;
339
340 /* Data must not cross a page boundary. */
6a8ed462 341 BUG_ON(size + offset > PAGE_SIZE<<compound_order(page));
f942dc25
IC
342
343 meta = npo->meta + npo->meta_prod - 1;
344
6a8ed462
IC
345 /* Skip unused frames from start of page */
346 page += offset >> PAGE_SHIFT;
347 offset &= ~PAGE_MASK;
348
f942dc25 349 while (size > 0) {
6a8ed462 350 BUG_ON(offset >= PAGE_SIZE);
f942dc25
IC
351 BUG_ON(npo->copy_off > MAX_BUFFER_OFFSET);
352
6a8ed462
IC
353 bytes = PAGE_SIZE - offset;
354
355 if (bytes > size)
356 bytes = size;
357
33bc801d 358 if (start_new_rx_buffer(npo->copy_off, bytes, *head)) {
f942dc25
IC
359 /*
360 * Netfront requires there to be some data in the head
361 * buffer.
362 */
33bc801d 363 BUG_ON(*head);
f942dc25
IC
364
365 meta = get_next_rx_buffer(vif, npo);
366 }
367
f942dc25
IC
368 if (npo->copy_off + bytes > MAX_BUFFER_OFFSET)
369 bytes = MAX_BUFFER_OFFSET - npo->copy_off;
370
371 copy_gop = npo->copy + npo->copy_prod++;
372 copy_gop->flags = GNTCOPY_dest_gref;
b3f980bd
WL
373 copy_gop->len = bytes;
374
43e9d194
WL
375 copy_gop->source.domid = DOMID_SELF;
376 copy_gop->source.u.gmfn = virt_to_mfn(page_address(page));
f942dc25 377 copy_gop->source.offset = offset;
f942dc25 378
b3f980bd 379 copy_gop->dest.domid = vif->domid;
f942dc25
IC
380 copy_gop->dest.offset = npo->copy_off;
381 copy_gop->dest.u.ref = npo->copy_gref;
f942dc25
IC
382
383 npo->copy_off += bytes;
384 meta->size += bytes;
385
386 offset += bytes;
387 size -= bytes;
388
6a8ed462
IC
389 /* Next frame */
390 if (offset == PAGE_SIZE && size) {
391 BUG_ON(!PageCompound(page));
392 page++;
393 offset = 0;
394 }
395
f942dc25 396 /* Leave a gap for the GSO descriptor. */
33bc801d 397 if (*head && skb_shinfo(skb)->gso_size && !vif->gso_prefix)
f942dc25
IC
398 vif->rx.req_cons++;
399
33bc801d 400 *head = 0; /* There must be something in this buffer now. */
f942dc25
IC
401
402 }
403}
404
405/*
406 * Prepare an SKB to be transmitted to the frontend.
407 *
408 * This function is responsible for allocating grant operations, meta
409 * structures, etc.
410 *
411 * It returns the number of meta structures consumed. The number of
412 * ring slots used is always equal to the number of meta slots used
413 * plus the number of GSO descriptors used. Currently, we use either
414 * zero GSO descriptors (for non-GSO packets) or one descriptor (for
415 * frontend-side LRO).
416 */
7376419a
WL
417static int xenvif_gop_skb(struct sk_buff *skb,
418 struct netrx_pending_operations *npo)
f942dc25
IC
419{
420 struct xenvif *vif = netdev_priv(skb->dev);
421 int nr_frags = skb_shinfo(skb)->nr_frags;
422 int i;
423 struct xen_netif_rx_request *req;
b3f980bd 424 struct xenvif_rx_meta *meta;
f942dc25 425 unsigned char *data;
33bc801d 426 int head = 1;
f942dc25
IC
427 int old_meta_prod;
428
429 old_meta_prod = npo->meta_prod;
430
431 /* Set up a GSO prefix descriptor, if necessary */
432 if (skb_shinfo(skb)->gso_size && vif->gso_prefix) {
433 req = RING_GET_REQUEST(&vif->rx, vif->rx.req_cons++);
434 meta = npo->meta + npo->meta_prod++;
435 meta->gso_size = skb_shinfo(skb)->gso_size;
436 meta->size = 0;
437 meta->id = req->id;
438 }
439
440 req = RING_GET_REQUEST(&vif->rx, vif->rx.req_cons++);
441 meta = npo->meta + npo->meta_prod++;
442
443 if (!vif->gso_prefix)
444 meta->gso_size = skb_shinfo(skb)->gso_size;
445 else
446 meta->gso_size = 0;
447
448 meta->size = 0;
449 meta->id = req->id;
450 npo->copy_off = 0;
451 npo->copy_gref = req->gref;
452
453 data = skb->data;
454 while (data < skb_tail_pointer(skb)) {
455 unsigned int offset = offset_in_page(data);
456 unsigned int len = PAGE_SIZE - offset;
457
458 if (data + len > skb_tail_pointer(skb))
459 len = skb_tail_pointer(skb) - data;
460
7376419a 461 xenvif_gop_frag_copy(vif, skb, npo,
33bc801d 462 virt_to_page(data), len, offset, &head);
f942dc25
IC
463 data += len;
464 }
465
466 for (i = 0; i < nr_frags; i++) {
7376419a
WL
467 xenvif_gop_frag_copy(vif, skb, npo,
468 skb_frag_page(&skb_shinfo(skb)->frags[i]),
469 skb_frag_size(&skb_shinfo(skb)->frags[i]),
470 skb_shinfo(skb)->frags[i].page_offset,
33bc801d 471 &head);
f942dc25
IC
472 }
473
474 return npo->meta_prod - old_meta_prod;
475}
476
477/*
7376419a 478 * This is a twin to xenvif_gop_skb. Assume that xenvif_gop_skb was
f942dc25
IC
479 * used to set up the operations on the top of
480 * netrx_pending_operations, which have since been done. Check that
481 * they didn't give any errors and advance over them.
482 */
7376419a
WL
483static int xenvif_check_gop(struct xenvif *vif, int nr_meta_slots,
484 struct netrx_pending_operations *npo)
f942dc25
IC
485{
486 struct gnttab_copy *copy_op;
487 int status = XEN_NETIF_RSP_OKAY;
488 int i;
489
490 for (i = 0; i < nr_meta_slots; i++) {
491 copy_op = npo->copy + npo->copy_cons++;
492 if (copy_op->status != GNTST_okay) {
493 netdev_dbg(vif->dev,
494 "Bad status %d from copy to DOM%d.\n",
495 copy_op->status, vif->domid);
496 status = XEN_NETIF_RSP_ERROR;
497 }
498 }
499
500 return status;
501}
502
7376419a
WL
503static void xenvif_add_frag_responses(struct xenvif *vif, int status,
504 struct xenvif_rx_meta *meta,
505 int nr_meta_slots)
f942dc25
IC
506{
507 int i;
508 unsigned long offset;
509
510 /* No fragments used */
511 if (nr_meta_slots <= 1)
512 return;
513
514 nr_meta_slots--;
515
516 for (i = 0; i < nr_meta_slots; i++) {
517 int flags;
518 if (i == nr_meta_slots - 1)
519 flags = 0;
520 else
521 flags = XEN_NETRXF_more_data;
522
523 offset = 0;
524 make_rx_response(vif, meta[i].id, status, offset,
525 meta[i].size, flags);
526 }
527}
528
33bc801d
WL
529struct skb_cb_overlay {
530 int meta_slots_used;
531};
532
7376419a 533static void xenvif_kick_thread(struct xenvif *vif)
b3f980bd
WL
534{
535 wake_up(&vif->wq);
536}
537
7376419a 538void xenvif_rx_action(struct xenvif *vif)
f942dc25 539{
f942dc25 540 s8 status;
e1f00a69 541 u16 flags;
f942dc25
IC
542 struct xen_netif_rx_response *resp;
543 struct sk_buff_head rxq;
544 struct sk_buff *skb;
545 LIST_HEAD(notify);
546 int ret;
547 int nr_frags;
548 int count;
549 unsigned long offset;
550 struct skb_cb_overlay *sco;
b3f980bd 551 int need_to_notify = 0;
f942dc25
IC
552
553 struct netrx_pending_operations npo = {
b3f980bd
WL
554 .copy = vif->grant_copy_op,
555 .meta = vif->meta,
f942dc25
IC
556 };
557
558 skb_queue_head_init(&rxq);
559
560 count = 0;
561
b3f980bd 562 while ((skb = skb_dequeue(&vif->rx_queue)) != NULL) {
f942dc25
IC
563 vif = netdev_priv(skb->dev);
564 nr_frags = skb_shinfo(skb)->nr_frags;
565
566 sco = (struct skb_cb_overlay *)skb->cb;
7376419a 567 sco->meta_slots_used = xenvif_gop_skb(skb, &npo);
f942dc25 568
33bc801d 569 count += nr_frags + 1;
f942dc25
IC
570
571 __skb_queue_tail(&rxq, skb);
572
573 /* Filled the batch queue? */
33bc801d
WL
574 /* XXX FIXME: RX path dependent on MAX_SKB_FRAGS */
575 if (count + MAX_SKB_FRAGS >= XEN_NETIF_RX_RING_SIZE)
f942dc25
IC
576 break;
577 }
578
b3f980bd 579 BUG_ON(npo.meta_prod > ARRAY_SIZE(vif->meta));
f942dc25
IC
580
581 if (!npo.copy_prod)
582 return;
583
b3f980bd
WL
584 BUG_ON(npo.copy_prod > ARRAY_SIZE(vif->grant_copy_op));
585 gnttab_batch_copy(vif->grant_copy_op, npo.copy_prod);
f942dc25
IC
586
587 while ((skb = __skb_dequeue(&rxq)) != NULL) {
588 sco = (struct skb_cb_overlay *)skb->cb;
589
590 vif = netdev_priv(skb->dev);
591
b3f980bd 592 if (vif->meta[npo.meta_cons].gso_size && vif->gso_prefix) {
f942dc25 593 resp = RING_GET_RESPONSE(&vif->rx,
b3f980bd 594 vif->rx.rsp_prod_pvt++);
f942dc25
IC
595
596 resp->flags = XEN_NETRXF_gso_prefix | XEN_NETRXF_more_data;
597
b3f980bd
WL
598 resp->offset = vif->meta[npo.meta_cons].gso_size;
599 resp->id = vif->meta[npo.meta_cons].id;
f942dc25
IC
600 resp->status = sco->meta_slots_used;
601
602 npo.meta_cons++;
603 sco->meta_slots_used--;
604 }
605
606
607 vif->dev->stats.tx_bytes += skb->len;
608 vif->dev->stats.tx_packets++;
609
7376419a 610 status = xenvif_check_gop(vif, sco->meta_slots_used, &npo);
f942dc25
IC
611
612 if (sco->meta_slots_used == 1)
613 flags = 0;
614 else
615 flags = XEN_NETRXF_more_data;
616
617 if (skb->ip_summed == CHECKSUM_PARTIAL) /* local packet? */
618 flags |= XEN_NETRXF_csum_blank | XEN_NETRXF_data_validated;
619 else if (skb->ip_summed == CHECKSUM_UNNECESSARY)
620 /* remote but checksummed. */
621 flags |= XEN_NETRXF_data_validated;
622
623 offset = 0;
b3f980bd 624 resp = make_rx_response(vif, vif->meta[npo.meta_cons].id,
f942dc25 625 status, offset,
b3f980bd 626 vif->meta[npo.meta_cons].size,
f942dc25
IC
627 flags);
628
b3f980bd 629 if (vif->meta[npo.meta_cons].gso_size && !vif->gso_prefix) {
f942dc25
IC
630 struct xen_netif_extra_info *gso =
631 (struct xen_netif_extra_info *)
632 RING_GET_RESPONSE(&vif->rx,
633 vif->rx.rsp_prod_pvt++);
634
635 resp->flags |= XEN_NETRXF_extra_info;
636
b3f980bd 637 gso->u.gso.size = vif->meta[npo.meta_cons].gso_size;
f942dc25
IC
638 gso->u.gso.type = XEN_NETIF_GSO_TYPE_TCPV4;
639 gso->u.gso.pad = 0;
640 gso->u.gso.features = 0;
641
642 gso->type = XEN_NETIF_EXTRA_TYPE_GSO;
643 gso->flags = 0;
644 }
645
7376419a
WL
646 xenvif_add_frag_responses(vif, status,
647 vif->meta + npo.meta_cons + 1,
648 sco->meta_slots_used);
f942dc25
IC
649
650 RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(&vif->rx, ret);
f942dc25 651
b3f980bd
WL
652 if (ret)
653 need_to_notify = 1;
654
f942dc25
IC
655 xenvif_notify_tx_completion(vif);
656
f942dc25
IC
657 npo.meta_cons += sco->meta_slots_used;
658 dev_kfree_skb(skb);
659 }
660
b3f980bd 661 if (need_to_notify)
e1f00a69 662 notify_remote_via_irq(vif->rx_irq);
f942dc25
IC
663
664 /* More work to do? */
b3f980bd 665 if (!skb_queue_empty(&vif->rx_queue))
7376419a 666 xenvif_kick_thread(vif);
f942dc25
IC
667}
668
7376419a 669void xenvif_queue_tx_skb(struct xenvif *vif, struct sk_buff *skb)
f942dc25 670{
b3f980bd 671 skb_queue_tail(&vif->rx_queue, skb);
f942dc25 672
7376419a 673 xenvif_kick_thread(vif);
f942dc25
IC
674}
675
7376419a 676void xenvif_check_rx_xenvif(struct xenvif *vif)
f942dc25
IC
677{
678 int more_to_do;
679
680 RING_FINAL_CHECK_FOR_REQUESTS(&vif->tx, more_to_do);
681
682 if (more_to_do)
b3f980bd 683 napi_schedule(&vif->napi);
f942dc25
IC
684}
685
686static void tx_add_credit(struct xenvif *vif)
687{
688 unsigned long max_burst, max_credit;
689
690 /*
691 * Allow a burst big enough to transmit a jumbo packet of up to 128kB.
692 * Otherwise the interface can seize up due to insufficient credit.
693 */
694 max_burst = RING_GET_REQUEST(&vif->tx, vif->tx.req_cons)->size;
695 max_burst = min(max_burst, 131072UL);
696 max_burst = max(max_burst, vif->credit_bytes);
697
698 /* Take care that adding a new chunk of credit doesn't wrap to zero. */
699 max_credit = vif->remaining_credit + vif->credit_bytes;
700 if (max_credit < vif->remaining_credit)
701 max_credit = ULONG_MAX; /* wrapped: clamp to ULONG_MAX */
702
703 vif->remaining_credit = min(max_credit, max_burst);
704}
705
706static void tx_credit_callback(unsigned long data)
707{
708 struct xenvif *vif = (struct xenvif *)data;
709 tx_add_credit(vif);
7376419a 710 xenvif_check_rx_xenvif(vif);
f942dc25
IC
711}
712
7376419a
WL
713static void xenvif_tx_err(struct xenvif *vif,
714 struct xen_netif_tx_request *txp, RING_IDX end)
f942dc25
IC
715{
716 RING_IDX cons = vif->tx.req_cons;
717
718 do {
719 make_tx_response(vif, txp, XEN_NETIF_RSP_ERROR);
b9149729 720 if (cons == end)
f942dc25
IC
721 break;
722 txp = RING_GET_REQUEST(&vif->tx, cons++);
723 } while (1);
724 vif->tx.req_cons = cons;
f942dc25
IC
725}
726
7376419a 727static void xenvif_fatal_tx_err(struct xenvif *vif)
48856286
IC
728{
729 netdev_err(vif->dev, "fatal error; disabling device\n");
730 xenvif_carrier_off(vif);
48856286
IC
731}
732
7376419a
WL
733static int xenvif_count_requests(struct xenvif *vif,
734 struct xen_netif_tx_request *first,
735 struct xen_netif_tx_request *txp,
736 int work_to_do)
f942dc25
IC
737{
738 RING_IDX cons = vif->tx.req_cons;
2810e5b9
WL
739 int slots = 0;
740 int drop_err = 0;
59ccb4eb 741 int more_data;
f942dc25
IC
742
743 if (!(first->flags & XEN_NETTXF_more_data))
744 return 0;
745
746 do {
59ccb4eb
WL
747 struct xen_netif_tx_request dropped_tx = { 0 };
748
2810e5b9
WL
749 if (slots >= work_to_do) {
750 netdev_err(vif->dev,
751 "Asked for %d slots but exceeds this limit\n",
752 work_to_do);
7376419a 753 xenvif_fatal_tx_err(vif);
35876b5f 754 return -ENODATA;
f942dc25
IC
755 }
756
2810e5b9
WL
757 /* This guest is really using too many slots and
758 * considered malicious.
759 */
37641494 760 if (unlikely(slots >= fatal_skb_slots)) {
2810e5b9
WL
761 netdev_err(vif->dev,
762 "Malicious frontend using %d slots, threshold %u\n",
37641494 763 slots, fatal_skb_slots);
7376419a 764 xenvif_fatal_tx_err(vif);
35876b5f 765 return -E2BIG;
f942dc25
IC
766 }
767
2810e5b9 768 /* Xen network protocol had implicit dependency on
37641494
WL
769 * MAX_SKB_FRAGS. XEN_NETBK_LEGACY_SLOTS_MAX is set to
770 * the historical MAX_SKB_FRAGS value 18 to honor the
771 * same behavior as before. Any packet using more than
772 * 18 slots but less than fatal_skb_slots slots is
773 * dropped
2810e5b9 774 */
37641494 775 if (!drop_err && slots >= XEN_NETBK_LEGACY_SLOTS_MAX) {
2810e5b9
WL
776 if (net_ratelimit())
777 netdev_dbg(vif->dev,
778 "Too many slots (%d) exceeding limit (%d), dropping packet\n",
37641494 779 slots, XEN_NETBK_LEGACY_SLOTS_MAX);
2810e5b9
WL
780 drop_err = -E2BIG;
781 }
782
59ccb4eb
WL
783 if (drop_err)
784 txp = &dropped_tx;
785
2810e5b9 786 memcpy(txp, RING_GET_REQUEST(&vif->tx, cons + slots),
f942dc25 787 sizeof(*txp));
03393fd5
WL
788
789 /* If the guest submitted a frame >= 64 KiB then
790 * first->size overflowed and following slots will
791 * appear to be larger than the frame.
792 *
793 * This cannot be fatal error as there are buggy
794 * frontends that do this.
795 *
796 * Consume all slots and drop the packet.
797 */
798 if (!drop_err && txp->size > first->size) {
799 if (net_ratelimit())
800 netdev_dbg(vif->dev,
801 "Invalid tx request, slot size %u > remaining size %u\n",
802 txp->size, first->size);
803 drop_err = -EIO;
f942dc25
IC
804 }
805
806 first->size -= txp->size;
2810e5b9 807 slots++;
f942dc25
IC
808
809 if (unlikely((txp->offset + txp->size) > PAGE_SIZE)) {
2810e5b9 810 netdev_err(vif->dev, "Cross page boundary, txp->offset: %x, size: %u\n",
f942dc25 811 txp->offset, txp->size);
7376419a 812 xenvif_fatal_tx_err(vif);
35876b5f 813 return -EINVAL;
f942dc25 814 }
59ccb4eb
WL
815
816 more_data = txp->flags & XEN_NETTXF_more_data;
817
818 if (!drop_err)
819 txp++;
820
821 } while (more_data);
2810e5b9
WL
822
823 if (drop_err) {
7376419a 824 xenvif_tx_err(vif, first, cons + slots);
2810e5b9
WL
825 return drop_err;
826 }
827
828 return slots;
f942dc25
IC
829}
830
7376419a
WL
831static struct page *xenvif_alloc_page(struct xenvif *vif,
832 u16 pending_idx)
f942dc25
IC
833{
834 struct page *page;
b3f980bd
WL
835
836 page = alloc_page(GFP_ATOMIC|__GFP_COLD);
f942dc25
IC
837 if (!page)
838 return NULL;
b3f980bd
WL
839 vif->mmap_pages[pending_idx] = page;
840
f942dc25
IC
841 return page;
842}
843
7376419a
WL
844static struct gnttab_copy *xenvif_get_requests(struct xenvif *vif,
845 struct sk_buff *skb,
846 struct xen_netif_tx_request *txp,
847 struct gnttab_copy *gop)
f942dc25
IC
848{
849 struct skb_shared_info *shinfo = skb_shinfo(skb);
850 skb_frag_t *frags = shinfo->frags;
ea066ad1 851 u16 pending_idx = *((u16 *)skb->data);
2810e5b9
WL
852 u16 head_idx = 0;
853 int slot, start;
854 struct page *page;
855 pending_ring_idx_t index, start_idx = 0;
856 uint16_t dst_offset;
857 unsigned int nr_slots;
858 struct pending_tx_info *first = NULL;
859
860 /* At this point shinfo->nr_frags is in fact the number of
37641494 861 * slots, which can be as large as XEN_NETBK_LEGACY_SLOTS_MAX.
2810e5b9
WL
862 */
863 nr_slots = shinfo->nr_frags;
f942dc25
IC
864
865 /* Skip first skb fragment if it is on same page as header fragment. */
ea066ad1 866 start = (frag_get_pending_idx(&shinfo->frags[0]) == pending_idx);
f942dc25 867
2810e5b9
WL
868 /* Coalesce tx requests, at this point the packet passed in
869 * should be <= 64K. Any packets larger than 64K have been
7376419a 870 * handled in xenvif_count_requests().
2810e5b9
WL
871 */
872 for (shinfo->nr_frags = slot = start; slot < nr_slots;
873 shinfo->nr_frags++) {
f942dc25 874 struct pending_tx_info *pending_tx_info =
b3f980bd 875 vif->pending_tx_info;
f942dc25 876
b3f980bd 877 page = alloc_page(GFP_ATOMIC|__GFP_COLD);
f942dc25 878 if (!page)
4cc7c1cb 879 goto err;
f942dc25 880
2810e5b9
WL
881 dst_offset = 0;
882 first = NULL;
883 while (dst_offset < PAGE_SIZE && slot < nr_slots) {
884 gop->flags = GNTCOPY_source_gref;
885
886 gop->source.u.ref = txp->gref;
887 gop->source.domid = vif->domid;
888 gop->source.offset = txp->offset;
889
890 gop->dest.domid = DOMID_SELF;
891
892 gop->dest.offset = dst_offset;
893 gop->dest.u.gmfn = virt_to_mfn(page_address(page));
894
895 if (dst_offset + txp->size > PAGE_SIZE) {
896 /* This page can only merge a portion
897 * of tx request. Do not increment any
898 * pointer / counter here. The txp
899 * will be dealt with in future
900 * rounds, eventually hitting the
901 * `else` branch.
902 */
903 gop->len = PAGE_SIZE - dst_offset;
904 txp->offset += gop->len;
905 txp->size -= gop->len;
906 dst_offset += gop->len; /* quit loop */
907 } else {
908 /* This tx request can be merged in the page */
909 gop->len = txp->size;
910 dst_offset += gop->len;
911
b3f980bd 912 index = pending_index(vif->pending_cons++);
2810e5b9 913
b3f980bd 914 pending_idx = vif->pending_ring[index];
2810e5b9
WL
915
916 memcpy(&pending_tx_info[pending_idx].req, txp,
917 sizeof(*txp));
2810e5b9
WL
918
919 /* Poison these fields, corresponding
920 * fields for head tx req will be set
921 * to correct values after the loop.
922 */
b3f980bd 923 vif->mmap_pages[pending_idx] = (void *)(~0UL);
2810e5b9
WL
924 pending_tx_info[pending_idx].head =
925 INVALID_PENDING_RING_IDX;
926
927 if (!first) {
928 first = &pending_tx_info[pending_idx];
929 start_idx = index;
930 head_idx = pending_idx;
931 }
932
933 txp++;
934 slot++;
935 }
f942dc25 936
2810e5b9
WL
937 gop++;
938 }
f942dc25 939
2810e5b9
WL
940 first->req.offset = 0;
941 first->req.size = dst_offset;
942 first->head = start_idx;
b3f980bd 943 vif->mmap_pages[head_idx] = page;
2810e5b9 944 frag_set_pending_idx(&frags[shinfo->nr_frags], head_idx);
f942dc25
IC
945 }
946
2810e5b9
WL
947 BUG_ON(shinfo->nr_frags > MAX_SKB_FRAGS);
948
f942dc25 949 return gop;
4cc7c1cb
IC
950err:
951 /* Unwind, freeing all pages and sending error responses. */
2810e5b9 952 while (shinfo->nr_frags-- > start) {
7376419a 953 xenvif_idx_release(vif,
2810e5b9
WL
954 frag_get_pending_idx(&frags[shinfo->nr_frags]),
955 XEN_NETIF_RSP_ERROR);
4cc7c1cb
IC
956 }
957 /* The head too, if necessary. */
958 if (start)
7376419a 959 xenvif_idx_release(vif, pending_idx, XEN_NETIF_RSP_ERROR);
4cc7c1cb
IC
960
961 return NULL;
f942dc25
IC
962}
963
7376419a
WL
964static int xenvif_tx_check_gop(struct xenvif *vif,
965 struct sk_buff *skb,
966 struct gnttab_copy **gopp)
f942dc25
IC
967{
968 struct gnttab_copy *gop = *gopp;
ea066ad1 969 u16 pending_idx = *((u16 *)skb->data);
f942dc25 970 struct skb_shared_info *shinfo = skb_shinfo(skb);
2810e5b9 971 struct pending_tx_info *tx_info;
f942dc25
IC
972 int nr_frags = shinfo->nr_frags;
973 int i, err, start;
2810e5b9 974 u16 peek; /* peek into next tx request */
f942dc25
IC
975
976 /* Check status of header. */
977 err = gop->status;
7d5145d8 978 if (unlikely(err))
7376419a 979 xenvif_idx_release(vif, pending_idx, XEN_NETIF_RSP_ERROR);
f942dc25
IC
980
981 /* Skip first skb fragment if it is on same page as header fragment. */
ea066ad1 982 start = (frag_get_pending_idx(&shinfo->frags[0]) == pending_idx);
f942dc25
IC
983
984 for (i = start; i < nr_frags; i++) {
985 int j, newerr;
2810e5b9 986 pending_ring_idx_t head;
f942dc25 987
ea066ad1 988 pending_idx = frag_get_pending_idx(&shinfo->frags[i]);
b3f980bd 989 tx_info = &vif->pending_tx_info[pending_idx];
2810e5b9 990 head = tx_info->head;
f942dc25
IC
991
992 /* Check error status: if okay then remember grant handle. */
2810e5b9
WL
993 do {
994 newerr = (++gop)->status;
995 if (newerr)
996 break;
b3f980bd
WL
997 peek = vif->pending_ring[pending_index(++head)];
998 } while (!pending_tx_is_head(vif, peek));
2810e5b9 999
f942dc25
IC
1000 if (likely(!newerr)) {
1001 /* Had a previous error? Invalidate this fragment. */
1002 if (unlikely(err))
7376419a
WL
1003 xenvif_idx_release(vif, pending_idx,
1004 XEN_NETIF_RSP_OKAY);
f942dc25
IC
1005 continue;
1006 }
1007
1008 /* Error on this fragment: respond to client with an error. */
7376419a 1009 xenvif_idx_release(vif, pending_idx, XEN_NETIF_RSP_ERROR);
f942dc25
IC
1010
1011 /* Not the first error? Preceding frags already invalidated. */
1012 if (err)
1013 continue;
1014
1015 /* First error: invalidate header and preceding fragments. */
1016 pending_idx = *((u16 *)skb->data);
7376419a 1017 xenvif_idx_release(vif, pending_idx, XEN_NETIF_RSP_OKAY);
f942dc25 1018 for (j = start; j < i; j++) {
5ccb3ea7 1019 pending_idx = frag_get_pending_idx(&shinfo->frags[j]);
7376419a
WL
1020 xenvif_idx_release(vif, pending_idx,
1021 XEN_NETIF_RSP_OKAY);
f942dc25
IC
1022 }
1023
1024 /* Remember the error: invalidate all subsequent fragments. */
1025 err = newerr;
1026 }
1027
1028 *gopp = gop + 1;
1029 return err;
1030}
1031
7376419a 1032static void xenvif_fill_frags(struct xenvif *vif, struct sk_buff *skb)
f942dc25
IC
1033{
1034 struct skb_shared_info *shinfo = skb_shinfo(skb);
1035 int nr_frags = shinfo->nr_frags;
1036 int i;
1037
1038 for (i = 0; i < nr_frags; i++) {
1039 skb_frag_t *frag = shinfo->frags + i;
1040 struct xen_netif_tx_request *txp;
ea066ad1
IC
1041 struct page *page;
1042 u16 pending_idx;
f942dc25 1043
ea066ad1 1044 pending_idx = frag_get_pending_idx(frag);
f942dc25 1045
b3f980bd
WL
1046 txp = &vif->pending_tx_info[pending_idx].req;
1047 page = virt_to_page(idx_to_kaddr(vif, pending_idx));
ea066ad1 1048 __skb_fill_page_desc(skb, i, page, txp->offset, txp->size);
f942dc25
IC
1049 skb->len += txp->size;
1050 skb->data_len += txp->size;
1051 skb->truesize += txp->size;
1052
7376419a 1053 /* Take an extra reference to offset xenvif_idx_release */
b3f980bd 1054 get_page(vif->mmap_pages[pending_idx]);
7376419a 1055 xenvif_idx_release(vif, pending_idx, XEN_NETIF_RSP_OKAY);
f942dc25
IC
1056 }
1057}
1058
7376419a 1059static int xenvif_get_extras(struct xenvif *vif,
f942dc25
IC
1060 struct xen_netif_extra_info *extras,
1061 int work_to_do)
1062{
1063 struct xen_netif_extra_info extra;
1064 RING_IDX cons = vif->tx.req_cons;
1065
1066 do {
1067 if (unlikely(work_to_do-- <= 0)) {
48856286 1068 netdev_err(vif->dev, "Missing extra info\n");
7376419a 1069 xenvif_fatal_tx_err(vif);
f942dc25
IC
1070 return -EBADR;
1071 }
1072
1073 memcpy(&extra, RING_GET_REQUEST(&vif->tx, cons),
1074 sizeof(extra));
1075 if (unlikely(!extra.type ||
1076 extra.type >= XEN_NETIF_EXTRA_TYPE_MAX)) {
1077 vif->tx.req_cons = ++cons;
48856286 1078 netdev_err(vif->dev,
f942dc25 1079 "Invalid extra type: %d\n", extra.type);
7376419a 1080 xenvif_fatal_tx_err(vif);
f942dc25
IC
1081 return -EINVAL;
1082 }
1083
1084 memcpy(&extras[extra.type - 1], &extra, sizeof(extra));
1085 vif->tx.req_cons = ++cons;
1086 } while (extra.flags & XEN_NETIF_EXTRA_FLAG_MORE);
1087
1088 return work_to_do;
1089}
1090
7376419a
WL
1091static int xenvif_set_skb_gso(struct xenvif *vif,
1092 struct sk_buff *skb,
1093 struct xen_netif_extra_info *gso)
f942dc25
IC
1094{
1095 if (!gso->u.gso.size) {
48856286 1096 netdev_err(vif->dev, "GSO size must not be zero.\n");
7376419a 1097 xenvif_fatal_tx_err(vif);
f942dc25
IC
1098 return -EINVAL;
1099 }
1100
a9468587
PD
1101 switch (gso->u.gso.type) {
1102 case XEN_NETIF_GSO_TYPE_TCPV4:
1103 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
1104 break;
1105 case XEN_NETIF_GSO_TYPE_TCPV6:
1106 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
1107 break;
1108 default:
48856286 1109 netdev_err(vif->dev, "Bad GSO type %d.\n", gso->u.gso.type);
7376419a 1110 xenvif_fatal_tx_err(vif);
f942dc25
IC
1111 return -EINVAL;
1112 }
1113
1114 skb_shinfo(skb)->gso_size = gso->u.gso.size;
f942dc25
IC
1115
1116 /* Header must be checked, and gso_segs computed. */
1117 skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
1118 skb_shinfo(skb)->gso_segs = 0;
1119
1120 return 0;
1121}
1122
2eba61d5
PD
1123static inline void maybe_pull_tail(struct sk_buff *skb, unsigned int len)
1124{
1125 if (skb_is_nonlinear(skb) && skb_headlen(skb) < len) {
1126 /* If we need to pullup then pullup to the max, so we
1127 * won't need to do it again.
1128 */
1129 int target = min_t(int, skb->len, MAX_TCP_HEADER);
1130 __pskb_pull_tail(skb, target - skb_headlen(skb));
1131 }
1132}
1133
1134static int checksum_setup_ip(struct xenvif *vif, struct sk_buff *skb,
1135 int recalculate_partial_csum)
f942dc25 1136{
2eba61d5
PD
1137 struct iphdr *iph = (void *)skb->data;
1138 unsigned int header_size;
1139 unsigned int off;
f942dc25 1140 int err = -EPROTO;
f942dc25 1141
2eba61d5 1142 off = sizeof(struct iphdr);
f942dc25 1143
2eba61d5
PD
1144 header_size = skb->network_header + off + MAX_IPOPTLEN;
1145 maybe_pull_tail(skb, header_size);
f942dc25 1146
2eba61d5 1147 off = iph->ihl * 4;
f942dc25 1148
f942dc25
IC
1149 switch (iph->protocol) {
1150 case IPPROTO_TCP:
2eba61d5 1151 if (!skb_partial_csum_set(skb, off,
bea89336
JW
1152 offsetof(struct tcphdr, check)))
1153 goto out;
f942dc25
IC
1154
1155 if (recalculate_partial_csum) {
bea89336 1156 struct tcphdr *tcph = tcp_hdr(skb);
2eba61d5
PD
1157
1158 header_size = skb->network_header +
1159 off +
1160 sizeof(struct tcphdr);
1161 maybe_pull_tail(skb, header_size);
1162
f942dc25 1163 tcph->check = ~csum_tcpudp_magic(iph->saddr, iph->daddr,
2eba61d5 1164 skb->len - off,
f942dc25
IC
1165 IPPROTO_TCP, 0);
1166 }
1167 break;
1168 case IPPROTO_UDP:
2eba61d5 1169 if (!skb_partial_csum_set(skb, off,
bea89336
JW
1170 offsetof(struct udphdr, check)))
1171 goto out;
f942dc25
IC
1172
1173 if (recalculate_partial_csum) {
bea89336 1174 struct udphdr *udph = udp_hdr(skb);
2eba61d5
PD
1175
1176 header_size = skb->network_header +
1177 off +
1178 sizeof(struct udphdr);
1179 maybe_pull_tail(skb, header_size);
1180
f942dc25 1181 udph->check = ~csum_tcpudp_magic(iph->saddr, iph->daddr,
2eba61d5 1182 skb->len - off,
f942dc25
IC
1183 IPPROTO_UDP, 0);
1184 }
1185 break;
1186 default:
1187 if (net_ratelimit())
1188 netdev_err(vif->dev,
2eba61d5
PD
1189 "Attempting to checksum a non-TCP/UDP packet, "
1190 "dropping a protocol %d packet\n",
f942dc25
IC
1191 iph->protocol);
1192 goto out;
1193 }
1194
f942dc25
IC
1195 err = 0;
1196
1197out:
1198 return err;
1199}
1200
2eba61d5
PD
1201static int checksum_setup_ipv6(struct xenvif *vif, struct sk_buff *skb,
1202 int recalculate_partial_csum)
1203{
1204 int err = -EPROTO;
1205 struct ipv6hdr *ipv6h = (void *)skb->data;
1206 u8 nexthdr;
1207 unsigned int header_size;
1208 unsigned int off;
1209 bool fragment;
1210 bool done;
1211
1212 done = false;
1213
1214 off = sizeof(struct ipv6hdr);
1215
1216 header_size = skb->network_header + off;
1217 maybe_pull_tail(skb, header_size);
1218
1219 nexthdr = ipv6h->nexthdr;
1220
1221 while ((off <= sizeof(struct ipv6hdr) + ntohs(ipv6h->payload_len)) &&
1222 !done) {
1223 switch (nexthdr) {
1224 case IPPROTO_DSTOPTS:
1225 case IPPROTO_HOPOPTS:
1226 case IPPROTO_ROUTING: {
1227 struct ipv6_opt_hdr *hp = (void *)(skb->data + off);
1228
1229 header_size = skb->network_header +
1230 off +
1231 sizeof(struct ipv6_opt_hdr);
1232 maybe_pull_tail(skb, header_size);
1233
1234 nexthdr = hp->nexthdr;
1235 off += ipv6_optlen(hp);
1236 break;
1237 }
1238 case IPPROTO_AH: {
1239 struct ip_auth_hdr *hp = (void *)(skb->data + off);
1240
1241 header_size = skb->network_header +
1242 off +
1243 sizeof(struct ip_auth_hdr);
1244 maybe_pull_tail(skb, header_size);
1245
1246 nexthdr = hp->nexthdr;
1247 off += (hp->hdrlen+2)<<2;
1248 break;
1249 }
1250 case IPPROTO_FRAGMENT:
1251 fragment = true;
1252 /* fall through */
1253 default:
1254 done = true;
1255 break;
1256 }
1257 }
1258
1259 if (!done) {
1260 if (net_ratelimit())
1261 netdev_err(vif->dev, "Failed to parse packet header\n");
1262 goto out;
1263 }
1264
1265 if (fragment) {
1266 if (net_ratelimit())
1267 netdev_err(vif->dev, "Packet is a fragment!\n");
1268 goto out;
1269 }
1270
1271 switch (nexthdr) {
1272 case IPPROTO_TCP:
1273 if (!skb_partial_csum_set(skb, off,
1274 offsetof(struct tcphdr, check)))
1275 goto out;
1276
1277 if (recalculate_partial_csum) {
1278 struct tcphdr *tcph = tcp_hdr(skb);
1279
1280 header_size = skb->network_header +
1281 off +
1282 sizeof(struct tcphdr);
1283 maybe_pull_tail(skb, header_size);
1284
1285 tcph->check = ~csum_ipv6_magic(&ipv6h->saddr,
1286 &ipv6h->daddr,
1287 skb->len - off,
1288 IPPROTO_TCP, 0);
1289 }
1290 break;
1291 case IPPROTO_UDP:
1292 if (!skb_partial_csum_set(skb, off,
1293 offsetof(struct udphdr, check)))
1294 goto out;
1295
1296 if (recalculate_partial_csum) {
1297 struct udphdr *udph = udp_hdr(skb);
1298
1299 header_size = skb->network_header +
1300 off +
1301 sizeof(struct udphdr);
1302 maybe_pull_tail(skb, header_size);
1303
1304 udph->check = ~csum_ipv6_magic(&ipv6h->saddr,
1305 &ipv6h->daddr,
1306 skb->len - off,
1307 IPPROTO_UDP, 0);
1308 }
1309 break;
1310 default:
1311 if (net_ratelimit())
1312 netdev_err(vif->dev,
1313 "Attempting to checksum a non-TCP/UDP packet, "
1314 "dropping a protocol %d packet\n",
1315 nexthdr);
1316 goto out;
1317 }
1318
1319 err = 0;
1320
1321out:
1322 return err;
1323}
1324
1325static int checksum_setup(struct xenvif *vif, struct sk_buff *skb)
1326{
1327 int err = -EPROTO;
1328 int recalculate_partial_csum = 0;
1329
1330 /* A GSO SKB must be CHECKSUM_PARTIAL. However some buggy
1331 * peers can fail to set NETRXF_csum_blank when sending a GSO
1332 * frame. In this case force the SKB to CHECKSUM_PARTIAL and
1333 * recalculate the partial checksum.
1334 */
1335 if (skb->ip_summed != CHECKSUM_PARTIAL && skb_is_gso(skb)) {
1336 vif->rx_gso_checksum_fixup++;
1337 skb->ip_summed = CHECKSUM_PARTIAL;
1338 recalculate_partial_csum = 1;
1339 }
1340
1341 /* A non-CHECKSUM_PARTIAL SKB does not require setup. */
1342 if (skb->ip_summed != CHECKSUM_PARTIAL)
1343 return 0;
1344
1345 if (skb->protocol == htons(ETH_P_IP))
1346 err = checksum_setup_ip(vif, skb, recalculate_partial_csum);
1347 else if (skb->protocol == htons(ETH_P_IPV6))
1348 err = checksum_setup_ipv6(vif, skb, recalculate_partial_csum);
1349
1350 return err;
1351}
1352
f942dc25
IC
1353static bool tx_credit_exceeded(struct xenvif *vif, unsigned size)
1354{
1355 unsigned long now = jiffies;
1356 unsigned long next_credit =
1357 vif->credit_timeout.expires +
1358 msecs_to_jiffies(vif->credit_usec / 1000);
1359
1360 /* Timer could already be pending in rare cases. */
1361 if (timer_pending(&vif->credit_timeout))
1362 return true;
1363
1364 /* Passed the point where we can replenish credit? */
1365 if (time_after_eq(now, next_credit)) {
1366 vif->credit_timeout.expires = now;
1367 tx_add_credit(vif);
1368 }
1369
1370 /* Still too big to send right now? Set a callback. */
1371 if (size > vif->remaining_credit) {
1372 vif->credit_timeout.data =
1373 (unsigned long)vif;
1374 vif->credit_timeout.function =
1375 tx_credit_callback;
1376 mod_timer(&vif->credit_timeout,
1377 next_credit);
1378
1379 return true;
1380 }
1381
1382 return false;
1383}
1384
7376419a 1385static unsigned xenvif_tx_build_gops(struct xenvif *vif)
f942dc25 1386{
b3f980bd 1387 struct gnttab_copy *gop = vif->tx_copy_ops, *request_gop;
f942dc25
IC
1388 struct sk_buff *skb;
1389 int ret;
1390
b3f980bd
WL
1391 while ((nr_pending_reqs(vif) + XEN_NETBK_LEGACY_SLOTS_MAX
1392 < MAX_PENDING_REQS)) {
f942dc25 1393 struct xen_netif_tx_request txreq;
37641494 1394 struct xen_netif_tx_request txfrags[XEN_NETBK_LEGACY_SLOTS_MAX];
f942dc25
IC
1395 struct page *page;
1396 struct xen_netif_extra_info extras[XEN_NETIF_EXTRA_TYPE_MAX-1];
1397 u16 pending_idx;
1398 RING_IDX idx;
1399 int work_to_do;
1400 unsigned int data_len;
1401 pending_ring_idx_t index;
1402
48856286
IC
1403 if (vif->tx.sring->req_prod - vif->tx.req_cons >
1404 XEN_NETIF_TX_RING_SIZE) {
1405 netdev_err(vif->dev,
1406 "Impossible number of requests. "
1407 "req_prod %d, req_cons %d, size %ld\n",
1408 vif->tx.sring->req_prod, vif->tx.req_cons,
1409 XEN_NETIF_TX_RING_SIZE);
7376419a 1410 xenvif_fatal_tx_err(vif);
48856286
IC
1411 continue;
1412 }
1413
f942dc25 1414 RING_FINAL_CHECK_FOR_REQUESTS(&vif->tx, work_to_do);
b3f980bd
WL
1415 if (!work_to_do)
1416 break;
f942dc25
IC
1417
1418 idx = vif->tx.req_cons;
1419 rmb(); /* Ensure that we see the request before we copy it. */
1420 memcpy(&txreq, RING_GET_REQUEST(&vif->tx, idx), sizeof(txreq));
1421
1422 /* Credit-based scheduling. */
1423 if (txreq.size > vif->remaining_credit &&
b3f980bd
WL
1424 tx_credit_exceeded(vif, txreq.size))
1425 break;
f942dc25
IC
1426
1427 vif->remaining_credit -= txreq.size;
1428
1429 work_to_do--;
1430 vif->tx.req_cons = ++idx;
1431
1432 memset(extras, 0, sizeof(extras));
1433 if (txreq.flags & XEN_NETTXF_extra_info) {
7376419a
WL
1434 work_to_do = xenvif_get_extras(vif, extras,
1435 work_to_do);
f942dc25 1436 idx = vif->tx.req_cons;
48856286 1437 if (unlikely(work_to_do < 0))
b3f980bd 1438 break;
f942dc25
IC
1439 }
1440
7376419a 1441 ret = xenvif_count_requests(vif, &txreq, txfrags, work_to_do);
48856286 1442 if (unlikely(ret < 0))
b3f980bd 1443 break;
48856286 1444
f942dc25
IC
1445 idx += ret;
1446
1447 if (unlikely(txreq.size < ETH_HLEN)) {
1448 netdev_dbg(vif->dev,
1449 "Bad packet size: %d\n", txreq.size);
7376419a 1450 xenvif_tx_err(vif, &txreq, idx);
b3f980bd 1451 break;
f942dc25
IC
1452 }
1453
1454 /* No crossing a page as the payload mustn't fragment. */
1455 if (unlikely((txreq.offset + txreq.size) > PAGE_SIZE)) {
48856286 1456 netdev_err(vif->dev,
f942dc25
IC
1457 "txreq.offset: %x, size: %u, end: %lu\n",
1458 txreq.offset, txreq.size,
1459 (txreq.offset&~PAGE_MASK) + txreq.size);
7376419a 1460 xenvif_fatal_tx_err(vif);
b3f980bd 1461 break;
f942dc25
IC
1462 }
1463
b3f980bd
WL
1464 index = pending_index(vif->pending_cons);
1465 pending_idx = vif->pending_ring[index];
f942dc25
IC
1466
1467 data_len = (txreq.size > PKT_PROT_LEN &&
37641494 1468 ret < XEN_NETBK_LEGACY_SLOTS_MAX) ?
f942dc25
IC
1469 PKT_PROT_LEN : txreq.size;
1470
1471 skb = alloc_skb(data_len + NET_SKB_PAD + NET_IP_ALIGN,
1472 GFP_ATOMIC | __GFP_NOWARN);
1473 if (unlikely(skb == NULL)) {
1474 netdev_dbg(vif->dev,
1475 "Can't allocate a skb in start_xmit.\n");
7376419a 1476 xenvif_tx_err(vif, &txreq, idx);
f942dc25
IC
1477 break;
1478 }
1479
1480 /* Packets passed to netif_rx() must have some headroom. */
1481 skb_reserve(skb, NET_SKB_PAD + NET_IP_ALIGN);
1482
1483 if (extras[XEN_NETIF_EXTRA_TYPE_GSO - 1].type) {
1484 struct xen_netif_extra_info *gso;
1485 gso = &extras[XEN_NETIF_EXTRA_TYPE_GSO - 1];
1486
7376419a
WL
1487 if (xenvif_set_skb_gso(vif, skb, gso)) {
1488 /* Failure in xenvif_set_skb_gso is fatal. */
f942dc25 1489 kfree_skb(skb);
b3f980bd 1490 break;
f942dc25
IC
1491 }
1492 }
1493
1494 /* XXX could copy straight to head */
7376419a 1495 page = xenvif_alloc_page(vif, pending_idx);
f942dc25
IC
1496 if (!page) {
1497 kfree_skb(skb);
7376419a 1498 xenvif_tx_err(vif, &txreq, idx);
b3f980bd 1499 break;
f942dc25
IC
1500 }
1501
f942dc25
IC
1502 gop->source.u.ref = txreq.gref;
1503 gop->source.domid = vif->domid;
1504 gop->source.offset = txreq.offset;
1505
1506 gop->dest.u.gmfn = virt_to_mfn(page_address(page));
1507 gop->dest.domid = DOMID_SELF;
1508 gop->dest.offset = txreq.offset;
1509
1510 gop->len = txreq.size;
1511 gop->flags = GNTCOPY_source_gref;
1512
1513 gop++;
1514
b3f980bd 1515 memcpy(&vif->pending_tx_info[pending_idx].req,
f942dc25 1516 &txreq, sizeof(txreq));
b3f980bd 1517 vif->pending_tx_info[pending_idx].head = index;
f942dc25
IC
1518 *((u16 *)skb->data) = pending_idx;
1519
1520 __skb_put(skb, data_len);
1521
1522 skb_shinfo(skb)->nr_frags = ret;
1523 if (data_len < txreq.size) {
1524 skb_shinfo(skb)->nr_frags++;
ea066ad1
IC
1525 frag_set_pending_idx(&skb_shinfo(skb)->frags[0],
1526 pending_idx);
f942dc25 1527 } else {
ea066ad1
IC
1528 frag_set_pending_idx(&skb_shinfo(skb)->frags[0],
1529 INVALID_PENDING_IDX);
f942dc25
IC
1530 }
1531
b3f980bd 1532 vif->pending_cons++;
f942dc25 1533
7376419a 1534 request_gop = xenvif_get_requests(vif, skb, txfrags, gop);
f942dc25
IC
1535 if (request_gop == NULL) {
1536 kfree_skb(skb);
7376419a 1537 xenvif_tx_err(vif, &txreq, idx);
b3f980bd 1538 break;
f942dc25
IC
1539 }
1540 gop = request_gop;
1541
b3f980bd 1542 __skb_queue_tail(&vif->tx_queue, skb);
1e0b6eac 1543
f942dc25 1544 vif->tx.req_cons = idx;
f942dc25 1545
b3f980bd 1546 if ((gop-vif->tx_copy_ops) >= ARRAY_SIZE(vif->tx_copy_ops))
f942dc25
IC
1547 break;
1548 }
1549
b3f980bd 1550 return gop - vif->tx_copy_ops;
f942dc25
IC
1551}
1552
b3f980bd 1553
7376419a 1554static int xenvif_tx_submit(struct xenvif *vif, int budget)
f942dc25 1555{
b3f980bd 1556 struct gnttab_copy *gop = vif->tx_copy_ops;
f942dc25 1557 struct sk_buff *skb;
b3f980bd 1558 int work_done = 0;
f942dc25 1559
b3f980bd
WL
1560 while (work_done < budget &&
1561 (skb = __skb_dequeue(&vif->tx_queue)) != NULL) {
f942dc25 1562 struct xen_netif_tx_request *txp;
f942dc25
IC
1563 u16 pending_idx;
1564 unsigned data_len;
1565
1566 pending_idx = *((u16 *)skb->data);
b3f980bd 1567 txp = &vif->pending_tx_info[pending_idx].req;
f942dc25
IC
1568
1569 /* Check the remap error code. */
7376419a 1570 if (unlikely(xenvif_tx_check_gop(vif, skb, &gop))) {
f942dc25
IC
1571 netdev_dbg(vif->dev, "netback grant failed.\n");
1572 skb_shinfo(skb)->nr_frags = 0;
1573 kfree_skb(skb);
1574 continue;
1575 }
1576
1577 data_len = skb->len;
1578 memcpy(skb->data,
b3f980bd 1579 (void *)(idx_to_kaddr(vif, pending_idx)|txp->offset),
f942dc25
IC
1580 data_len);
1581 if (data_len < txp->size) {
1582 /* Append the packet payload as a fragment. */
1583 txp->offset += data_len;
1584 txp->size -= data_len;
1585 } else {
1586 /* Schedule a response immediately. */
7376419a
WL
1587 xenvif_idx_release(vif, pending_idx,
1588 XEN_NETIF_RSP_OKAY);
f942dc25
IC
1589 }
1590
1591 if (txp->flags & XEN_NETTXF_csum_blank)
1592 skb->ip_summed = CHECKSUM_PARTIAL;
1593 else if (txp->flags & XEN_NETTXF_data_validated)
1594 skb->ip_summed = CHECKSUM_UNNECESSARY;
1595
7376419a 1596 xenvif_fill_frags(vif, skb);
f942dc25 1597
2eba61d5 1598 if (skb_is_nonlinear(skb) && skb_headlen(skb) < PKT_PROT_LEN) {
f942dc25
IC
1599 int target = min_t(int, skb->len, PKT_PROT_LEN);
1600 __pskb_pull_tail(skb, target - skb_headlen(skb));
1601 }
1602
1603 skb->dev = vif->dev;
1604 skb->protocol = eth_type_trans(skb, skb->dev);
f9ca8f74 1605 skb_reset_network_header(skb);
f942dc25
IC
1606
1607 if (checksum_setup(vif, skb)) {
1608 netdev_dbg(vif->dev,
1609 "Can't setup checksum in net_tx_action\n");
1610 kfree_skb(skb);
1611 continue;
1612 }
1613
40893fd0 1614 skb_probe_transport_header(skb, 0);
f9ca8f74 1615
f942dc25
IC
1616 vif->dev->stats.rx_bytes += skb->len;
1617 vif->dev->stats.rx_packets++;
1618
b3f980bd
WL
1619 work_done++;
1620
1621 netif_receive_skb(skb);
f942dc25 1622 }
b3f980bd
WL
1623
1624 return work_done;
f942dc25
IC
1625}
1626
1627/* Called after netfront has transmitted */
7376419a 1628int xenvif_tx_action(struct xenvif *vif, int budget)
f942dc25
IC
1629{
1630 unsigned nr_gops;
b3f980bd 1631 int work_done;
f942dc25 1632
b3f980bd
WL
1633 if (unlikely(!tx_work_todo(vif)))
1634 return 0;
1635
7376419a 1636 nr_gops = xenvif_tx_build_gops(vif);
f942dc25
IC
1637
1638 if (nr_gops == 0)
b3f980bd
WL
1639 return 0;
1640
1641 gnttab_batch_copy(vif->tx_copy_ops, nr_gops);
f942dc25 1642
7376419a 1643 work_done = xenvif_tx_submit(vif, nr_gops);
f942dc25 1644
b3f980bd 1645 return work_done;
f942dc25
IC
1646}
1647
7376419a
WL
1648static void xenvif_idx_release(struct xenvif *vif, u16 pending_idx,
1649 u8 status)
f942dc25 1650{
f942dc25 1651 struct pending_tx_info *pending_tx_info;
2810e5b9
WL
1652 pending_ring_idx_t head;
1653 u16 peek; /* peek into next tx request */
1654
b3f980bd 1655 BUG_ON(vif->mmap_pages[pending_idx] == (void *)(~0UL));
f942dc25
IC
1656
1657 /* Already complete? */
b3f980bd 1658 if (vif->mmap_pages[pending_idx] == NULL)
f942dc25
IC
1659 return;
1660
b3f980bd 1661 pending_tx_info = &vif->pending_tx_info[pending_idx];
f942dc25 1662
2810e5b9 1663 head = pending_tx_info->head;
f942dc25 1664
b3f980bd
WL
1665 BUG_ON(!pending_tx_is_head(vif, head));
1666 BUG_ON(vif->pending_ring[pending_index(head)] != pending_idx);
f942dc25 1667
2810e5b9
WL
1668 do {
1669 pending_ring_idx_t index;
1670 pending_ring_idx_t idx = pending_index(head);
b3f980bd 1671 u16 info_idx = vif->pending_ring[idx];
f942dc25 1672
b3f980bd 1673 pending_tx_info = &vif->pending_tx_info[info_idx];
2810e5b9
WL
1674 make_tx_response(vif, &pending_tx_info->req, status);
1675
1676 /* Setting any number other than
1677 * INVALID_PENDING_RING_IDX indicates this slot is
1678 * starting a new packet / ending a previous packet.
1679 */
1680 pending_tx_info->head = 0;
1681
b3f980bd
WL
1682 index = pending_index(vif->pending_prod++);
1683 vif->pending_ring[index] = vif->pending_ring[info_idx];
f942dc25 1684
b3f980bd 1685 peek = vif->pending_ring[pending_index(++head)];
2810e5b9 1686
b3f980bd 1687 } while (!pending_tx_is_head(vif, peek));
2810e5b9 1688
b3f980bd
WL
1689 put_page(vif->mmap_pages[pending_idx]);
1690 vif->mmap_pages[pending_idx] = NULL;
f942dc25
IC
1691}
1692
2810e5b9 1693
f942dc25
IC
1694static void make_tx_response(struct xenvif *vif,
1695 struct xen_netif_tx_request *txp,
1696 s8 st)
1697{
1698 RING_IDX i = vif->tx.rsp_prod_pvt;
1699 struct xen_netif_tx_response *resp;
1700 int notify;
1701
1702 resp = RING_GET_RESPONSE(&vif->tx, i);
1703 resp->id = txp->id;
1704 resp->status = st;
1705
1706 if (txp->flags & XEN_NETTXF_extra_info)
1707 RING_GET_RESPONSE(&vif->tx, ++i)->status = XEN_NETIF_RSP_NULL;
1708
1709 vif->tx.rsp_prod_pvt = ++i;
1710 RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(&vif->tx, notify);
1711 if (notify)
e1f00a69 1712 notify_remote_via_irq(vif->tx_irq);
f942dc25
IC
1713}
1714
1715static struct xen_netif_rx_response *make_rx_response(struct xenvif *vif,
1716 u16 id,
1717 s8 st,
1718 u16 offset,
1719 u16 size,
1720 u16 flags)
1721{
1722 RING_IDX i = vif->rx.rsp_prod_pvt;
1723 struct xen_netif_rx_response *resp;
1724
1725 resp = RING_GET_RESPONSE(&vif->rx, i);
1726 resp->offset = offset;
1727 resp->flags = flags;
1728 resp->id = id;
1729 resp->status = (s16)size;
1730 if (st < 0)
1731 resp->status = (s16)st;
1732
1733 vif->rx.rsp_prod_pvt = ++i;
1734
1735 return resp;
1736}
1737
b3f980bd 1738static inline int rx_work_todo(struct xenvif *vif)
f942dc25 1739{
b3f980bd 1740 return !skb_queue_empty(&vif->rx_queue);
f942dc25
IC
1741}
1742
b3f980bd 1743static inline int tx_work_todo(struct xenvif *vif)
f942dc25
IC
1744{
1745
b3f980bd
WL
1746 if (likely(RING_HAS_UNCONSUMED_REQUESTS(&vif->tx)) &&
1747 (nr_pending_reqs(vif) + XEN_NETBK_LEGACY_SLOTS_MAX
1748 < MAX_PENDING_REQS))
f942dc25
IC
1749 return 1;
1750
1751 return 0;
1752}
1753
7376419a 1754void xenvif_unmap_frontend_rings(struct xenvif *vif)
f942dc25 1755{
c9d63699
DV
1756 if (vif->tx.sring)
1757 xenbus_unmap_ring_vfree(xenvif_to_xenbus_device(vif),
1758 vif->tx.sring);
1759 if (vif->rx.sring)
1760 xenbus_unmap_ring_vfree(xenvif_to_xenbus_device(vif),
1761 vif->rx.sring);
f942dc25
IC
1762}
1763
7376419a
WL
1764int xenvif_map_frontend_rings(struct xenvif *vif,
1765 grant_ref_t tx_ring_ref,
1766 grant_ref_t rx_ring_ref)
f942dc25 1767{
c9d63699 1768 void *addr;
f942dc25
IC
1769 struct xen_netif_tx_sring *txs;
1770 struct xen_netif_rx_sring *rxs;
1771
1772 int err = -ENOMEM;
1773
c9d63699
DV
1774 err = xenbus_map_ring_valloc(xenvif_to_xenbus_device(vif),
1775 tx_ring_ref, &addr);
1776 if (err)
f942dc25
IC
1777 goto err;
1778
c9d63699 1779 txs = (struct xen_netif_tx_sring *)addr;
f942dc25
IC
1780 BACK_RING_INIT(&vif->tx, txs, PAGE_SIZE);
1781
c9d63699
DV
1782 err = xenbus_map_ring_valloc(xenvif_to_xenbus_device(vif),
1783 rx_ring_ref, &addr);
1784 if (err)
f942dc25 1785 goto err;
f942dc25 1786
c9d63699 1787 rxs = (struct xen_netif_rx_sring *)addr;
f942dc25
IC
1788 BACK_RING_INIT(&vif->rx, rxs, PAGE_SIZE);
1789
c9d63699
DV
1790 vif->rx_req_cons_peek = 0;
1791
f942dc25
IC
1792 return 0;
1793
1794err:
7376419a 1795 xenvif_unmap_frontend_rings(vif);
f942dc25
IC
1796 return err;
1797}
1798
7376419a 1799int xenvif_kthread(void *data)
b3f980bd
WL
1800{
1801 struct xenvif *vif = data;
1802
1803 while (!kthread_should_stop()) {
1804 wait_event_interruptible(vif->wq,
1805 rx_work_todo(vif) ||
1806 kthread_should_stop());
1807 if (kthread_should_stop())
1808 break;
1809
1810 if (rx_work_todo(vif))
7376419a 1811 xenvif_rx_action(vif);
b3f980bd
WL
1812
1813 cond_resched();
1814 }
1815
1816 return 0;
1817}
1818
f942dc25
IC
1819static int __init netback_init(void)
1820{
f942dc25 1821 int rc = 0;
f942dc25 1822
2a14b244 1823 if (!xen_domain())
f942dc25
IC
1824 return -ENODEV;
1825
37641494 1826 if (fatal_skb_slots < XEN_NETBK_LEGACY_SLOTS_MAX) {
383eda32
JP
1827 pr_info("fatal_skb_slots too small (%d), bump it to XEN_NETBK_LEGACY_SLOTS_MAX (%d)\n",
1828 fatal_skb_slots, XEN_NETBK_LEGACY_SLOTS_MAX);
37641494 1829 fatal_skb_slots = XEN_NETBK_LEGACY_SLOTS_MAX;
2810e5b9
WL
1830 }
1831
f942dc25
IC
1832 rc = xenvif_xenbus_init();
1833 if (rc)
1834 goto failed_init;
1835
1836 return 0;
1837
1838failed_init:
f942dc25 1839 return rc;
f942dc25
IC
1840}
1841
1842module_init(netback_init);
1843
b103f358
WL
1844static void __exit netback_fini(void)
1845{
b103f358 1846 xenvif_xenbus_fini();
b103f358
WL
1847}
1848module_exit(netback_fini);
1849
f942dc25 1850MODULE_LICENSE("Dual BSD/GPL");
f984cec6 1851MODULE_ALIAS("xen-backend:vif");