Commit | Line | Data |
---|---|---|
3b20eb23 | 1 | // SPDX-License-Identifier: GPL-2.0-only |
3e7ee490 | 2 | /* |
3e7ee490 HJ |
3 | * Copyright (c) 2009, Microsoft Corporation. |
4 | * | |
3e7ee490 HJ |
5 | * Authors: |
6 | * Haiyang Zhang <haiyangz@microsoft.com> | |
7 | * Hank Janssen <hjanssen@microsoft.com> | |
3e7ee490 | 8 | */ |
0a46618d HJ |
9 | #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt |
10 | ||
5654e932 | 11 | #include <linux/kernel.h> |
0c3b7b2f S |
12 | #include <linux/sched.h> |
13 | #include <linux/wait.h> | |
a0086dc5 | 14 | #include <linux/mm.h> |
5a0e3ad6 | 15 | #include <linux/slab.h> |
c88c4e4c | 16 | #include <linux/module.h> |
46a97191 | 17 | #include <linux/hyperv.h> |
011a7c3c | 18 | #include <linux/uio.h> |
63d55b2a | 19 | #include <linux/interrupt.h> |
6ba34171 | 20 | #include <asm/page.h> |
5bf74682 | 21 | #include <asm/mshyperv.h> |
3f335ea2 | 22 | |
0f2a6619 | 23 | #include "hyperv_vmbus.h" |
3e7ee490 | 24 | |
c1135c7f BF |
25 | /* |
26 | * hv_gpadl_size - Return the real size of a gpadl, the size that Hyper-V uses | |
27 | * | |
28 | * For BUFFER gpadl, Hyper-V uses the exact same size as the guest does. | |
29 | * | |
30 | * For RING gpadl, in each ring, the guest uses one PAGE_SIZE as the header | |
31 | * (because of the alignment requirement), however, the hypervisor only | |
32 | * uses the first HV_HYP_PAGE_SIZE as the header, therefore leaving a | |
33 | * (PAGE_SIZE - HV_HYP_PAGE_SIZE) gap. And since there are two rings in a | |
34 | * ringbuffer, the total size for a RING gpadl that Hyper-V uses is the | |
35 | * total size that the guest uses minus twice of the gap size. | |
36 | */ | |
37 | static inline u32 hv_gpadl_size(enum hv_gpadl_type type, u32 size) | |
38 | { | |
39 | switch (type) { | |
40 | case HV_GPADL_BUFFER: | |
41 | return size; | |
42 | case HV_GPADL_RING: | |
43 | /* The size of a ringbuffer must be page-aligned */ | |
44 | BUG_ON(size % PAGE_SIZE); | |
45 | /* | |
46 | * Two things to notice here: | |
47 | * 1) We're processing two ring buffers as a unit | |
48 | * 2) We're skipping any space larger than HV_HYP_PAGE_SIZE in | |
49 | * the first guest-size page of each of the two ring buffers. | |
50 | * So we effectively subtract out two guest-size pages, and add | |
51 | * back two Hyper-V size pages. | |
52 | */ | |
53 | return size - 2 * (PAGE_SIZE - HV_HYP_PAGE_SIZE); | |
54 | } | |
55 | BUG(); | |
56 | return 0; | |
57 | } | |
58 | ||
59 | /* | |
60 | * hv_ring_gpadl_send_hvpgoffset - Calculate the send offset (in unit of | |
61 | * HV_HYP_PAGE) in a ring gpadl based on the | |
62 | * offset in the guest | |
63 | * | |
64 | * @offset: the offset (in bytes) where the send ringbuffer starts in the | |
65 | * virtual address space of the guest | |
66 | */ | |
67 | static inline u32 hv_ring_gpadl_send_hvpgoffset(u32 offset) | |
68 | { | |
69 | ||
70 | /* | |
71 | * For RING gpadl, in each ring, the guest uses one PAGE_SIZE as the | |
72 | * header (because of the alignment requirement), however, the | |
73 | * hypervisor only uses the first HV_HYP_PAGE_SIZE as the header, | |
74 | * therefore leaving a (PAGE_SIZE - HV_HYP_PAGE_SIZE) gap. | |
75 | * | |
76 | * And to calculate the effective send offset in gpadl, we need to | |
77 | * substract this gap. | |
78 | */ | |
79 | return (offset - (PAGE_SIZE - HV_HYP_PAGE_SIZE)) >> HV_HYP_PAGE_SHIFT; | |
80 | } | |
81 | ||
82 | /* | |
83 | * hv_gpadl_hvpfn - Return the Hyper-V page PFN of the @i th Hyper-V page in | |
84 | * the gpadl | |
85 | * | |
86 | * @type: the type of the gpadl | |
87 | * @kbuffer: the pointer to the gpadl in the guest | |
88 | * @size: the total size (in bytes) of the gpadl | |
89 | * @send_offset: the offset (in bytes) where the send ringbuffer starts in the | |
90 | * virtual address space of the guest | |
91 | * @i: the index | |
92 | */ | |
93 | static inline u64 hv_gpadl_hvpfn(enum hv_gpadl_type type, void *kbuffer, | |
94 | u32 size, u32 send_offset, int i) | |
95 | { | |
96 | int send_idx = hv_ring_gpadl_send_hvpgoffset(send_offset); | |
97 | unsigned long delta = 0UL; | |
98 | ||
99 | switch (type) { | |
100 | case HV_GPADL_BUFFER: | |
101 | break; | |
102 | case HV_GPADL_RING: | |
103 | if (i == 0) | |
104 | delta = 0; | |
105 | else if (i <= send_idx) | |
106 | delta = PAGE_SIZE - HV_HYP_PAGE_SIZE; | |
107 | else | |
108 | delta = 2 * (PAGE_SIZE - HV_HYP_PAGE_SIZE); | |
109 | break; | |
110 | default: | |
111 | BUG(); | |
112 | break; | |
113 | } | |
114 | ||
115 | return virt_to_hvpfn(kbuffer + delta + (HV_HYP_PAGE_SIZE * i)); | |
116 | } | |
117 | ||
3e189519 | 118 | /* |
fff41b2e | 119 | * vmbus_setevent - Trigger an event notification on the specified |
3e189519 | 120 | * channel. |
f4266e34 | 121 | */ |
1f6ee4e7 | 122 | void vmbus_setevent(struct vmbus_channel *channel) |
3e7ee490 | 123 | { |
39d70a4a | 124 | struct hv_monitor_page *monitorpage; |
3e7ee490 | 125 | |
991f8f1c VK |
126 | trace_vmbus_setevent(channel); |
127 | ||
3724287c S |
128 | /* |
129 | * For channels marked as in "low latency" mode | |
130 | * bypass the monitor page mechanism. | |
131 | */ | |
5c1bec61 SH |
132 | if (channel->offermsg.monitor_allocated && !channel->low_latency) { |
133 | vmbus_send_interrupt(channel->offermsg.child_relid); | |
3e7ee490 | 134 | |
8681db44 GKH |
135 | /* Get the child to parent monitor page */ |
136 | monitorpage = vmbus_connection.monitor_pages[1]; | |
3e7ee490 | 137 | |
22356585 | 138 | sync_set_bit(channel->monitor_bit, |
f6feebe0 HZ |
139 | (unsigned long *)&monitorpage->trigger_group |
140 | [channel->monitor_grp].pending); | |
7c369f40 | 141 | |
f4266e34 | 142 | } else { |
21c3bef5 | 143 | vmbus_set_event(channel); |
3e7ee490 | 144 | } |
3e7ee490 | 145 | } |
1f6ee4e7 | 146 | EXPORT_SYMBOL_GPL(vmbus_setevent); |
3e7ee490 | 147 | |
ae6935ed SH |
148 | /* vmbus_free_ring - drop mapping of ring buffer */ |
149 | void vmbus_free_ring(struct vmbus_channel *channel) | |
3e7ee490 | 150 | { |
ae6935ed SH |
151 | hv_ringbuffer_cleanup(&channel->outbound); |
152 | hv_ringbuffer_cleanup(&channel->inbound); | |
3e7ee490 | 153 | |
ae6935ed SH |
154 | if (channel->ringbuffer_page) { |
155 | __free_pages(channel->ringbuffer_page, | |
156 | get_order(channel->ringbuffer_pagecount | |
157 | << PAGE_SHIFT)); | |
158 | channel->ringbuffer_page = NULL; | |
159 | } | |
160 | } | |
161 | EXPORT_SYMBOL_GPL(vmbus_free_ring); | |
98f531b1 | 162 | |
ae6935ed SH |
163 | /* vmbus_alloc_ring - allocate and map pages for ring buffer */ |
164 | int vmbus_alloc_ring(struct vmbus_channel *newchannel, | |
165 | u32 send_size, u32 recv_size) | |
166 | { | |
167 | struct page *page; | |
168 | int order; | |
52a42c2a | 169 | |
ae6935ed | 170 | if (send_size % PAGE_SIZE || recv_size % PAGE_SIZE) |
e68d2971 | 171 | return -EINVAL; |
3e7ee490 | 172 | |
454f18a9 | 173 | /* Allocate the ring buffer */ |
ae6935ed | 174 | order = get_order(send_size + recv_size); |
294409d2 | 175 | page = alloc_pages_node(cpu_to_node(newchannel->target_cpu), |
52a42c2a | 176 | GFP_KERNEL|__GFP_ZERO, order); |
294409d2 S |
177 | |
178 | if (!page) | |
52a42c2a | 179 | page = alloc_pages(GFP_KERNEL|__GFP_ZERO, order); |
df3493e0 | 180 | |
ae6935ed SH |
181 | if (!page) |
182 | return -ENOMEM; | |
3e7ee490 | 183 | |
52a42c2a | 184 | newchannel->ringbuffer_page = page; |
ae6935ed SH |
185 | newchannel->ringbuffer_pagecount = (send_size + recv_size) >> PAGE_SHIFT; |
186 | newchannel->ringbuffer_send_offset = send_size >> PAGE_SHIFT; | |
3e7ee490 | 187 | |
ae6935ed SH |
188 | return 0; |
189 | } | |
190 | EXPORT_SYMBOL_GPL(vmbus_alloc_ring); | |
72a95cbc | 191 | |
5c23a1a5 | 192 | /* Used for Hyper-V Socket: a guest client's connect() to the host */ |
593db803 AS |
193 | int vmbus_send_tl_connect_request(const guid_t *shv_guest_servie_id, |
194 | const guid_t *shv_host_servie_id) | |
5c23a1a5 DC |
195 | { |
196 | struct vmbus_channel_tl_connect_request conn_msg; | |
98f31a00 | 197 | int ret; |
5c23a1a5 DC |
198 | |
199 | memset(&conn_msg, 0, sizeof(conn_msg)); | |
200 | conn_msg.header.msgtype = CHANNELMSG_TL_CONNECT_REQUEST; | |
201 | conn_msg.guest_endpoint_id = *shv_guest_servie_id; | |
202 | conn_msg.host_service_id = *shv_host_servie_id; | |
203 | ||
98f31a00 VK |
204 | ret = vmbus_post_msg(&conn_msg, sizeof(conn_msg), true); |
205 | ||
206 | trace_vmbus_send_tl_connect_request(&conn_msg, ret); | |
207 | ||
208 | return ret; | |
5c23a1a5 DC |
209 | } |
210 | EXPORT_SYMBOL_GPL(vmbus_send_tl_connect_request); | |
211 | ||
870ced05 APM |
212 | static int send_modifychannel_without_ack(struct vmbus_channel *channel, u32 target_vp) |
213 | { | |
214 | struct vmbus_channel_modifychannel msg; | |
215 | int ret; | |
216 | ||
217 | memset(&msg, 0, sizeof(msg)); | |
218 | msg.header.msgtype = CHANNELMSG_MODIFYCHANNEL; | |
219 | msg.child_relid = channel->offermsg.child_relid; | |
220 | msg.target_vp = target_vp; | |
221 | ||
222 | ret = vmbus_post_msg(&msg, sizeof(msg), true); | |
223 | trace_vmbus_send_modifychannel(&msg, ret); | |
224 | ||
225 | return ret; | |
226 | } | |
227 | ||
228 | static int send_modifychannel_with_ack(struct vmbus_channel *channel, u32 target_vp) | |
229 | { | |
230 | struct vmbus_channel_modifychannel *msg; | |
231 | struct vmbus_channel_msginfo *info; | |
232 | unsigned long flags; | |
233 | int ret; | |
234 | ||
235 | info = kzalloc(sizeof(struct vmbus_channel_msginfo) + | |
236 | sizeof(struct vmbus_channel_modifychannel), | |
237 | GFP_KERNEL); | |
238 | if (!info) | |
239 | return -ENOMEM; | |
240 | ||
241 | init_completion(&info->waitevent); | |
242 | info->waiting_channel = channel; | |
243 | ||
244 | msg = (struct vmbus_channel_modifychannel *)info->msg; | |
245 | msg->header.msgtype = CHANNELMSG_MODIFYCHANNEL; | |
246 | msg->child_relid = channel->offermsg.child_relid; | |
247 | msg->target_vp = target_vp; | |
248 | ||
249 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); | |
250 | list_add_tail(&info->msglistentry, &vmbus_connection.chn_msg_list); | |
251 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); | |
252 | ||
253 | ret = vmbus_post_msg(msg, sizeof(*msg), true); | |
254 | trace_vmbus_send_modifychannel(msg, ret); | |
255 | if (ret != 0) { | |
256 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); | |
257 | list_del(&info->msglistentry); | |
258 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); | |
259 | goto free_info; | |
260 | } | |
261 | ||
262 | /* | |
263 | * Release channel_mutex; otherwise, vmbus_onoffer_rescind() could block on | |
264 | * the mutex and be unable to signal the completion. | |
265 | * | |
266 | * See the caller target_cpu_store() for information about the usage of the | |
267 | * mutex. | |
268 | */ | |
269 | mutex_unlock(&vmbus_connection.channel_mutex); | |
270 | wait_for_completion(&info->waitevent); | |
271 | mutex_lock(&vmbus_connection.channel_mutex); | |
272 | ||
273 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); | |
274 | list_del(&info->msglistentry); | |
275 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); | |
276 | ||
277 | if (info->response.modify_response.status) | |
278 | ret = -EAGAIN; | |
279 | ||
280 | free_info: | |
281 | kfree(info); | |
282 | return ret; | |
283 | } | |
284 | ||
75278105 APM |
285 | /* |
286 | * Set/change the vCPU (@target_vp) the channel (@child_relid) will interrupt. | |
287 | * | |
870ced05 APM |
288 | * CHANNELMSG_MODIFYCHANNEL messages are asynchronous. When VMbus version 5.3 |
289 | * or later is negotiated, Hyper-V always sends an ACK in response to such a | |
290 | * message. For VMbus version 5.2 and earlier, it never sends an ACK. With- | |
291 | * out an ACK, we can not know when the host will stop interrupting the "old" | |
292 | * vCPU and start interrupting the "new" vCPU for the given channel. | |
75278105 APM |
293 | * |
294 | * The CHANNELMSG_MODIFYCHANNEL message type is supported since VMBus version | |
295 | * VERSION_WIN10_V4_1. | |
296 | */ | |
870ced05 | 297 | int vmbus_send_modifychannel(struct vmbus_channel *channel, u32 target_vp) |
75278105 | 298 | { |
870ced05 APM |
299 | if (vmbus_proto_version >= VERSION_WIN10_V5_3) |
300 | return send_modifychannel_with_ack(channel, target_vp); | |
301 | return send_modifychannel_without_ack(channel, target_vp); | |
75278105 APM |
302 | } |
303 | EXPORT_SYMBOL_GPL(vmbus_send_modifychannel); | |
304 | ||
3e189519 | 305 | /* |
fff41b2e | 306 | * create_gpadl_header - Creates a gpadl for the specified buffer |
f4266e34 | 307 | */ |
c1135c7f BF |
308 | static int create_gpadl_header(enum hv_gpadl_type type, void *kbuffer, |
309 | u32 size, u32 send_offset, | |
4d637632 | 310 | struct vmbus_channel_msginfo **msginfo) |
3e7ee490 HJ |
311 | { |
312 | int i; | |
39d70a4a | 313 | int pagecount; |
39d70a4a HZ |
314 | struct vmbus_channel_gpadl_header *gpadl_header; |
315 | struct vmbus_channel_gpadl_body *gpadl_body; | |
316 | struct vmbus_channel_msginfo *msgheader; | |
317 | struct vmbus_channel_msginfo *msgbody = NULL; | |
318 | u32 msgsize; | |
3e7ee490 | 319 | |
39d70a4a | 320 | int pfnsum, pfncount, pfnleft, pfncurr, pfnsize; |
3e7ee490 | 321 | |
c1135c7f | 322 | pagecount = hv_gpadl_size(type, size) >> HV_HYP_PAGE_SHIFT; |
3e7ee490 | 323 | |
454f18a9 | 324 | /* do we need a gpadl body msg */ |
39d70a4a | 325 | pfnsize = MAX_SIZE_CHANNEL_MESSAGE - |
f4266e34 GKH |
326 | sizeof(struct vmbus_channel_gpadl_header) - |
327 | sizeof(struct gpa_range); | |
39d70a4a | 328 | pfncount = pfnsize / sizeof(u64); |
3e7ee490 | 329 | |
39d70a4a | 330 | if (pagecount > pfncount) { |
f4266e34 | 331 | /* we need a gpadl body */ |
454f18a9 | 332 | /* fill in the header */ |
39d70a4a | 333 | msgsize = sizeof(struct vmbus_channel_msginfo) + |
f4266e34 | 334 | sizeof(struct vmbus_channel_gpadl_header) + |
39d70a4a HZ |
335 | sizeof(struct gpa_range) + pfncount * sizeof(u64); |
336 | msgheader = kzalloc(msgsize, GFP_KERNEL); | |
337 | if (!msgheader) | |
d1c250bb | 338 | goto nomem; |
3e7ee490 | 339 | |
c50f7fb2 HZ |
340 | INIT_LIST_HEAD(&msgheader->submsglist); |
341 | msgheader->msgsize = msgsize; | |
3e7ee490 | 342 | |
39d70a4a | 343 | gpadl_header = (struct vmbus_channel_gpadl_header *) |
c50f7fb2 HZ |
344 | msgheader->msg; |
345 | gpadl_header->rangecount = 1; | |
346 | gpadl_header->range_buflen = sizeof(struct gpa_range) + | |
39d70a4a | 347 | pagecount * sizeof(u64); |
415f2287 | 348 | gpadl_header->range[0].byte_offset = 0; |
c1135c7f | 349 | gpadl_header->range[0].byte_count = hv_gpadl_size(type, size); |
39d70a4a | 350 | for (i = 0; i < pfncount; i++) |
c1135c7f BF |
351 | gpadl_header->range[0].pfn_array[i] = hv_gpadl_hvpfn( |
352 | type, kbuffer, size, send_offset, i); | |
39d70a4a | 353 | *msginfo = msgheader; |
3e7ee490 | 354 | |
39d70a4a HZ |
355 | pfnsum = pfncount; |
356 | pfnleft = pagecount - pfncount; | |
3e7ee490 | 357 | |
454f18a9 | 358 | /* how many pfns can we fit */ |
39d70a4a | 359 | pfnsize = MAX_SIZE_CHANNEL_MESSAGE - |
f4266e34 | 360 | sizeof(struct vmbus_channel_gpadl_body); |
39d70a4a | 361 | pfncount = pfnsize / sizeof(u64); |
3e7ee490 | 362 | |
454f18a9 | 363 | /* fill in the body */ |
39d70a4a HZ |
364 | while (pfnleft) { |
365 | if (pfnleft > pfncount) | |
366 | pfncurr = pfncount; | |
3e7ee490 | 367 | else |
39d70a4a | 368 | pfncurr = pfnleft; |
3e7ee490 | 369 | |
39d70a4a | 370 | msgsize = sizeof(struct vmbus_channel_msginfo) + |
f4266e34 | 371 | sizeof(struct vmbus_channel_gpadl_body) + |
39d70a4a HZ |
372 | pfncurr * sizeof(u64); |
373 | msgbody = kzalloc(msgsize, GFP_KERNEL); | |
f38cf9cc S |
374 | |
375 | if (!msgbody) { | |
376 | struct vmbus_channel_msginfo *pos = NULL; | |
377 | struct vmbus_channel_msginfo *tmp = NULL; | |
378 | /* | |
379 | * Free up all the allocated messages. | |
380 | */ | |
381 | list_for_each_entry_safe(pos, tmp, | |
382 | &msgheader->submsglist, | |
383 | msglistentry) { | |
384 | ||
385 | list_del(&pos->msglistentry); | |
386 | kfree(pos); | |
387 | } | |
388 | ||
d1c250bb | 389 | goto nomem; |
f38cf9cc S |
390 | } |
391 | ||
c50f7fb2 | 392 | msgbody->msgsize = msgsize; |
39d70a4a | 393 | gpadl_body = |
c50f7fb2 | 394 | (struct vmbus_channel_gpadl_body *)msgbody->msg; |
f4266e34 GKH |
395 | |
396 | /* | |
f4266e34 GKH |
397 | * Gpadl is u32 and we are using a pointer which could |
398 | * be 64-bit | |
f27df643 | 399 | * This is governed by the guest/host protocol and |
bdc1dd47 | 400 | * so the hypervisor guarantees that this is ok. |
f4266e34 | 401 | */ |
39d70a4a | 402 | for (i = 0; i < pfncurr; i++) |
c1135c7f BF |
403 | gpadl_body->pfn[i] = hv_gpadl_hvpfn(type, |
404 | kbuffer, size, send_offset, pfnsum + i); | |
3e7ee490 | 405 | |
454f18a9 | 406 | /* add to msg header */ |
c50f7fb2 HZ |
407 | list_add_tail(&msgbody->msglistentry, |
408 | &msgheader->submsglist); | |
39d70a4a HZ |
409 | pfnsum += pfncurr; |
410 | pfnleft -= pfncurr; | |
3e7ee490 | 411 | } |
f4266e34 | 412 | } else { |
454f18a9 | 413 | /* everything fits in a header */ |
39d70a4a | 414 | msgsize = sizeof(struct vmbus_channel_msginfo) + |
f4266e34 | 415 | sizeof(struct vmbus_channel_gpadl_header) + |
39d70a4a HZ |
416 | sizeof(struct gpa_range) + pagecount * sizeof(u64); |
417 | msgheader = kzalloc(msgsize, GFP_KERNEL); | |
418 | if (msgheader == NULL) | |
e3eb7cdd | 419 | goto nomem; |
4d637632 VK |
420 | |
421 | INIT_LIST_HEAD(&msgheader->submsglist); | |
c50f7fb2 | 422 | msgheader->msgsize = msgsize; |
39d70a4a HZ |
423 | |
424 | gpadl_header = (struct vmbus_channel_gpadl_header *) | |
c50f7fb2 HZ |
425 | msgheader->msg; |
426 | gpadl_header->rangecount = 1; | |
427 | gpadl_header->range_buflen = sizeof(struct gpa_range) + | |
39d70a4a | 428 | pagecount * sizeof(u64); |
415f2287 | 429 | gpadl_header->range[0].byte_offset = 0; |
c1135c7f | 430 | gpadl_header->range[0].byte_count = hv_gpadl_size(type, size); |
39d70a4a | 431 | for (i = 0; i < pagecount; i++) |
c1135c7f BF |
432 | gpadl_header->range[0].pfn_array[i] = hv_gpadl_hvpfn( |
433 | type, kbuffer, size, send_offset, i); | |
39d70a4a HZ |
434 | |
435 | *msginfo = msgheader; | |
3e7ee490 HJ |
436 | } |
437 | ||
438 | return 0; | |
d1c250bb | 439 | nomem: |
39d70a4a HZ |
440 | kfree(msgheader); |
441 | kfree(msgbody); | |
d1c250bb | 442 | return -ENOMEM; |
3e7ee490 HJ |
443 | } |
444 | ||
3e189519 | 445 | /* |
c1135c7f | 446 | * __vmbus_establish_gpadl - Establish a GPADL for a buffer or ringbuffer |
f4266e34 | 447 | * |
39d70a4a | 448 | * @channel: a channel |
c1135c7f | 449 | * @type: the type of the corresponding GPADL, only meaningful for the guest. |
b679ef73 | 450 | * @kbuffer: from kmalloc or vmalloc |
39d70a4a | 451 | * @size: page-size multiple |
c1135c7f | 452 | * @send_offset: the offset (in bytes) where the send ring buffer starts, |
f850a4ca | 453 | * should be 0 for BUFFER type gpadl |
39d70a4a | 454 | * @gpadl_handle: on success, receives the handle of the newly created GPADL |
f4266e34 | 455 | */ |
c1135c7f BF |
456 | static int __vmbus_establish_gpadl(struct vmbus_channel *channel, |
457 | enum hv_gpadl_type type, void *kbuffer, | |
458 | u32 size, u32 send_offset, | |
459 | u32 *gpadl_handle) | |
3e7ee490 | 460 | { |
39d70a4a HZ |
461 | struct vmbus_channel_gpadl_header *gpadlmsg; |
462 | struct vmbus_channel_gpadl_body *gpadl_body; | |
39d70a4a | 463 | struct vmbus_channel_msginfo *msginfo = NULL; |
7cc80c98 | 464 | struct vmbus_channel_msginfo *submsginfo, *tmp; |
53af545b | 465 | struct list_head *curr; |
39d70a4a | 466 | u32 next_gpadl_handle; |
dd0813b6 | 467 | unsigned long flags; |
c3bf2e26 | 468 | int ret = 0; |
3e7ee490 | 469 | |
9f52a163 S |
470 | next_gpadl_handle = |
471 | (atomic_inc_return(&vmbus_connection.next_gpadl_handle) - 1); | |
3e7ee490 | 472 | |
c1135c7f | 473 | ret = create_gpadl_header(type, kbuffer, size, send_offset, &msginfo); |
c3bf2e26 BP |
474 | if (ret) |
475 | return ret; | |
3e7ee490 | 476 | |
9568a193 | 477 | init_completion(&msginfo->waitevent); |
ccb61f8a | 478 | msginfo->waiting_channel = channel; |
c3bf2e26 | 479 | |
c50f7fb2 HZ |
480 | gpadlmsg = (struct vmbus_channel_gpadl_header *)msginfo->msg; |
481 | gpadlmsg->header.msgtype = CHANNELMSG_GPADL_HEADER; | |
482 | gpadlmsg->child_relid = channel->offermsg.child_relid; | |
483 | gpadlmsg->gpadl = next_gpadl_handle; | |
3e7ee490 | 484 | |
3e7ee490 | 485 | |
15b2f647 | 486 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); |
c50f7fb2 | 487 | list_add_tail(&msginfo->msglistentry, |
da9fcb72 | 488 | &vmbus_connection.chn_msg_list); |
3e7ee490 | 489 | |
15b2f647 | 490 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); |
3e7ee490 | 491 | |
6f3d791f S |
492 | if (channel->rescind) { |
493 | ret = -ENODEV; | |
494 | goto cleanup; | |
495 | } | |
496 | ||
c6977677 | 497 | ret = vmbus_post_msg(gpadlmsg, msginfo->msgsize - |
c0bb0392 | 498 | sizeof(*msginfo), true); |
69edbd5f VK |
499 | |
500 | trace_vmbus_establish_gpadl_header(gpadlmsg, ret); | |
501 | ||
98e08702 | 502 | if (ret != 0) |
00d760b0 | 503 | goto cleanup; |
3e7ee490 | 504 | |
4d637632 VK |
505 | list_for_each(curr, &msginfo->submsglist) { |
506 | submsginfo = (struct vmbus_channel_msginfo *)curr; | |
507 | gpadl_body = | |
508 | (struct vmbus_channel_gpadl_body *)submsginfo->msg; | |
53af545b | 509 | |
4d637632 VK |
510 | gpadl_body->header.msgtype = |
511 | CHANNELMSG_GPADL_BODY; | |
512 | gpadl_body->gpadl = next_gpadl_handle; | |
3e7ee490 | 513 | |
4d637632 | 514 | ret = vmbus_post_msg(gpadl_body, |
c0bb0392 VK |
515 | submsginfo->msgsize - sizeof(*submsginfo), |
516 | true); | |
69edbd5f VK |
517 | |
518 | trace_vmbus_establish_gpadl_body(gpadl_body, ret); | |
519 | ||
4d637632 VK |
520 | if (ret != 0) |
521 | goto cleanup; | |
3e7ee490 | 522 | |
3e7ee490 | 523 | } |
72c6b71c | 524 | wait_for_completion(&msginfo->waitevent); |
3e7ee490 | 525 | |
eceb0596 DC |
526 | if (msginfo->response.gpadl_created.creation_status != 0) { |
527 | pr_err("Failed to establish GPADL: err = 0x%x\n", | |
528 | msginfo->response.gpadl_created.creation_status); | |
529 | ||
530 | ret = -EDQUOT; | |
531 | goto cleanup; | |
532 | } | |
533 | ||
ccb61f8a S |
534 | if (channel->rescind) { |
535 | ret = -ENODEV; | |
536 | goto cleanup; | |
537 | } | |
538 | ||
454f18a9 | 539 | /* At this point, we received the gpadl created msg */ |
c50f7fb2 | 540 | *gpadl_handle = gpadlmsg->gpadl; |
3e7ee490 | 541 | |
00d760b0 | 542 | cleanup: |
15b2f647 | 543 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); |
c50f7fb2 | 544 | list_del(&msginfo->msglistentry); |
15b2f647 | 545 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); |
7cc80c98 VK |
546 | list_for_each_entry_safe(submsginfo, tmp, &msginfo->submsglist, |
547 | msglistentry) { | |
548 | kfree(submsginfo); | |
549 | } | |
3e7ee490 | 550 | |
39d70a4a | 551 | kfree(msginfo); |
3e7ee490 HJ |
552 | return ret; |
553 | } | |
c1135c7f BF |
554 | |
555 | /* | |
556 | * vmbus_establish_gpadl - Establish a GPADL for the specified buffer | |
557 | * | |
558 | * @channel: a channel | |
559 | * @kbuffer: from kmalloc or vmalloc | |
560 | * @size: page-size multiple | |
561 | * @gpadl_handle: on success, receives the handle of the newly created GPADL | |
562 | */ | |
563 | int vmbus_establish_gpadl(struct vmbus_channel *channel, void *kbuffer, | |
564 | u32 size, u32 *gpadl_handle) | |
565 | { | |
566 | return __vmbus_establish_gpadl(channel, HV_GPADL_BUFFER, kbuffer, size, | |
567 | 0U, gpadl_handle); | |
568 | } | |
98873724 | 569 | EXPORT_SYMBOL_GPL(vmbus_establish_gpadl); |
3e7ee490 | 570 | |
e8b7db38 AB |
571 | /** |
572 | * request_arr_init - Allocates memory for the requestor array. Each slot | |
573 | * keeps track of the next available slot in the array. Initially, each | |
574 | * slot points to the next one (as in a Linked List). The last slot | |
575 | * does not point to anything, so its value is U64_MAX by default. | |
576 | * @size: The size of the array | |
577 | */ | |
578 | static u64 *request_arr_init(u32 size) | |
579 | { | |
580 | int i; | |
581 | u64 *req_arr; | |
582 | ||
583 | req_arr = kcalloc(size, sizeof(u64), GFP_KERNEL); | |
584 | if (!req_arr) | |
585 | return NULL; | |
586 | ||
587 | for (i = 0; i < size - 1; i++) | |
588 | req_arr[i] = i + 1; | |
589 | ||
590 | /* Last slot (no more available slots) */ | |
591 | req_arr[i] = U64_MAX; | |
592 | ||
593 | return req_arr; | |
594 | } | |
595 | ||
596 | /* | |
597 | * vmbus_alloc_requestor - Initializes @rqstor's fields. | |
598 | * Index 0 is the first free slot | |
599 | * @size: Size of the requestor array | |
600 | */ | |
601 | static int vmbus_alloc_requestor(struct vmbus_requestor *rqstor, u32 size) | |
602 | { | |
603 | u64 *rqst_arr; | |
604 | unsigned long *bitmap; | |
605 | ||
606 | rqst_arr = request_arr_init(size); | |
607 | if (!rqst_arr) | |
608 | return -ENOMEM; | |
609 | ||
610 | bitmap = bitmap_zalloc(size, GFP_KERNEL); | |
611 | if (!bitmap) { | |
612 | kfree(rqst_arr); | |
613 | return -ENOMEM; | |
614 | } | |
615 | ||
616 | rqstor->req_arr = rqst_arr; | |
617 | rqstor->req_bitmap = bitmap; | |
618 | rqstor->size = size; | |
619 | rqstor->next_request_id = 0; | |
620 | spin_lock_init(&rqstor->req_lock); | |
621 | ||
622 | return 0; | |
623 | } | |
624 | ||
625 | /* | |
626 | * vmbus_free_requestor - Frees memory allocated for @rqstor | |
627 | * @rqstor: Pointer to the requestor struct | |
628 | */ | |
629 | static void vmbus_free_requestor(struct vmbus_requestor *rqstor) | |
630 | { | |
631 | kfree(rqstor->req_arr); | |
632 | bitmap_free(rqstor->req_bitmap); | |
633 | } | |
634 | ||
edd9bbc1 BF |
635 | static int __vmbus_open(struct vmbus_channel *newchannel, |
636 | void *userdata, u32 userdatalen, | |
637 | void (*onchannelcallback)(void *context), void *context) | |
638 | { | |
639 | struct vmbus_channel_open_channel *open_msg; | |
640 | struct vmbus_channel_msginfo *open_info = NULL; | |
641 | struct page *page = newchannel->ringbuffer_page; | |
642 | u32 send_pages, recv_pages; | |
643 | unsigned long flags; | |
644 | int err; | |
645 | ||
646 | if (userdatalen > MAX_USER_DEFINED_BYTES) | |
647 | return -EINVAL; | |
648 | ||
649 | send_pages = newchannel->ringbuffer_send_offset; | |
650 | recv_pages = newchannel->ringbuffer_pagecount - send_pages; | |
651 | ||
652 | if (newchannel->state != CHANNEL_OPEN_STATE) | |
653 | return -EINVAL; | |
654 | ||
e8b7db38 AB |
655 | /* Create and init requestor */ |
656 | if (newchannel->rqstor_size) { | |
657 | if (vmbus_alloc_requestor(&newchannel->requestor, newchannel->rqstor_size)) | |
658 | return -ENOMEM; | |
659 | } | |
660 | ||
edd9bbc1 BF |
661 | newchannel->state = CHANNEL_OPENING_STATE; |
662 | newchannel->onchannel_callback = onchannelcallback; | |
663 | newchannel->channel_callback_context = context; | |
664 | ||
adae1e93 AB |
665 | if (!newchannel->max_pkt_size) |
666 | newchannel->max_pkt_size = VMBUS_DEFAULT_MAX_PKT_SIZE; | |
667 | ||
668 | err = hv_ringbuffer_init(&newchannel->outbound, page, send_pages, 0); | |
edd9bbc1 BF |
669 | if (err) |
670 | goto error_clean_ring; | |
671 | ||
adae1e93 AB |
672 | err = hv_ringbuffer_init(&newchannel->inbound, &page[send_pages], |
673 | recv_pages, newchannel->max_pkt_size); | |
edd9bbc1 BF |
674 | if (err) |
675 | goto error_clean_ring; | |
676 | ||
677 | /* Establish the gpadl for the ring buffer */ | |
678 | newchannel->ringbuffer_gpadlhandle = 0; | |
679 | ||
c1135c7f BF |
680 | err = __vmbus_establish_gpadl(newchannel, HV_GPADL_RING, |
681 | page_address(newchannel->ringbuffer_page), | |
682 | (send_pages + recv_pages) << PAGE_SHIFT, | |
683 | newchannel->ringbuffer_send_offset << PAGE_SHIFT, | |
684 | &newchannel->ringbuffer_gpadlhandle); | |
edd9bbc1 BF |
685 | if (err) |
686 | goto error_clean_ring; | |
687 | ||
688 | /* Create and init the channel open message */ | |
e99c4afb | 689 | open_info = kzalloc(sizeof(*open_info) + |
edd9bbc1 BF |
690 | sizeof(struct vmbus_channel_open_channel), |
691 | GFP_KERNEL); | |
692 | if (!open_info) { | |
693 | err = -ENOMEM; | |
694 | goto error_free_gpadl; | |
695 | } | |
696 | ||
697 | init_completion(&open_info->waitevent); | |
698 | open_info->waiting_channel = newchannel; | |
699 | ||
700 | open_msg = (struct vmbus_channel_open_channel *)open_info->msg; | |
701 | open_msg->header.msgtype = CHANNELMSG_OPENCHANNEL; | |
702 | open_msg->openid = newchannel->offermsg.child_relid; | |
703 | open_msg->child_relid = newchannel->offermsg.child_relid; | |
704 | open_msg->ringbuffer_gpadlhandle = newchannel->ringbuffer_gpadlhandle; | |
c1135c7f BF |
705 | /* |
706 | * The unit of ->downstream_ringbuffer_pageoffset is HV_HYP_PAGE and | |
707 | * the unit of ->ringbuffer_send_offset (i.e. send_pages) is PAGE, so | |
708 | * here we calculate it into HV_HYP_PAGE. | |
709 | */ | |
710 | open_msg->downstream_ringbuffer_pageoffset = | |
711 | hv_ring_gpadl_send_hvpgoffset(send_pages << PAGE_SHIFT); | |
edd9bbc1 BF |
712 | open_msg->target_vp = hv_cpu_number_to_vp_number(newchannel->target_cpu); |
713 | ||
714 | if (userdatalen) | |
715 | memcpy(open_msg->userdata, userdata, userdatalen); | |
716 | ||
717 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); | |
718 | list_add_tail(&open_info->msglistentry, | |
719 | &vmbus_connection.chn_msg_list); | |
720 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); | |
721 | ||
722 | if (newchannel->rescind) { | |
723 | err = -ENODEV; | |
3e9bf43f | 724 | goto error_clean_msglist; |
edd9bbc1 BF |
725 | } |
726 | ||
727 | err = vmbus_post_msg(open_msg, | |
728 | sizeof(struct vmbus_channel_open_channel), true); | |
729 | ||
730 | trace_vmbus_open(open_msg, err); | |
731 | ||
732 | if (err != 0) | |
733 | goto error_clean_msglist; | |
734 | ||
735 | wait_for_completion(&open_info->waitevent); | |
736 | ||
737 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); | |
738 | list_del(&open_info->msglistentry); | |
739 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); | |
740 | ||
741 | if (newchannel->rescind) { | |
742 | err = -ENODEV; | |
743 | goto error_free_info; | |
744 | } | |
745 | ||
746 | if (open_info->response.open_result.status) { | |
747 | err = -EAGAIN; | |
748 | goto error_free_info; | |
749 | } | |
750 | ||
751 | newchannel->state = CHANNEL_OPENED_STATE; | |
752 | kfree(open_info); | |
753 | return 0; | |
754 | ||
755 | error_clean_msglist: | |
756 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); | |
757 | list_del(&open_info->msglistentry); | |
758 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); | |
759 | error_free_info: | |
760 | kfree(open_info); | |
761 | error_free_gpadl: | |
762 | vmbus_teardown_gpadl(newchannel, newchannel->ringbuffer_gpadlhandle); | |
763 | newchannel->ringbuffer_gpadlhandle = 0; | |
764 | error_clean_ring: | |
765 | hv_ringbuffer_cleanup(&newchannel->outbound); | |
766 | hv_ringbuffer_cleanup(&newchannel->inbound); | |
e8b7db38 | 767 | vmbus_free_requestor(&newchannel->requestor); |
edd9bbc1 BF |
768 | newchannel->state = CHANNEL_OPEN_STATE; |
769 | return err; | |
770 | } | |
771 | ||
772 | /* | |
773 | * vmbus_connect_ring - Open the channel but reuse ring buffer | |
774 | */ | |
775 | int vmbus_connect_ring(struct vmbus_channel *newchannel, | |
776 | void (*onchannelcallback)(void *context), void *context) | |
777 | { | |
778 | return __vmbus_open(newchannel, NULL, 0, onchannelcallback, context); | |
779 | } | |
780 | EXPORT_SYMBOL_GPL(vmbus_connect_ring); | |
781 | ||
782 | /* | |
783 | * vmbus_open - Open the specified channel. | |
784 | */ | |
785 | int vmbus_open(struct vmbus_channel *newchannel, | |
786 | u32 send_ringbuffer_size, u32 recv_ringbuffer_size, | |
787 | void *userdata, u32 userdatalen, | |
788 | void (*onchannelcallback)(void *context), void *context) | |
789 | { | |
790 | int err; | |
791 | ||
792 | err = vmbus_alloc_ring(newchannel, send_ringbuffer_size, | |
793 | recv_ringbuffer_size); | |
794 | if (err) | |
795 | return err; | |
796 | ||
797 | err = __vmbus_open(newchannel, userdata, userdatalen, | |
798 | onchannelcallback, context); | |
799 | if (err) | |
800 | vmbus_free_ring(newchannel); | |
801 | ||
802 | return err; | |
803 | } | |
804 | EXPORT_SYMBOL_GPL(vmbus_open); | |
805 | ||
3e189519 | 806 | /* |
fff41b2e | 807 | * vmbus_teardown_gpadl -Teardown the specified GPADL handle |
f4266e34 | 808 | */ |
fff41b2e | 809 | int vmbus_teardown_gpadl(struct vmbus_channel *channel, u32 gpadl_handle) |
3e7ee490 | 810 | { |
82250213 | 811 | struct vmbus_channel_gpadl_teardown *msg; |
aded7165 | 812 | struct vmbus_channel_msginfo *info; |
dd0813b6 | 813 | unsigned long flags; |
66be6530 | 814 | int ret; |
3e7ee490 | 815 | |
e99c4afb | 816 | info = kzalloc(sizeof(*info) + |
f4266e34 | 817 | sizeof(struct vmbus_channel_gpadl_teardown), GFP_KERNEL); |
c3bf2e26 BP |
818 | if (!info) |
819 | return -ENOMEM; | |
3e7ee490 | 820 | |
9568a193 | 821 | init_completion(&info->waitevent); |
ccb61f8a | 822 | info->waiting_channel = channel; |
3e7ee490 | 823 | |
c50f7fb2 | 824 | msg = (struct vmbus_channel_gpadl_teardown *)info->msg; |
3e7ee490 | 825 | |
c50f7fb2 HZ |
826 | msg->header.msgtype = CHANNELMSG_GPADL_TEARDOWN; |
827 | msg->child_relid = channel->offermsg.child_relid; | |
828 | msg->gpadl = gpadl_handle; | |
3e7ee490 | 829 | |
15b2f647 | 830 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); |
c50f7fb2 | 831 | list_add_tail(&info->msglistentry, |
da9fcb72 | 832 | &vmbus_connection.chn_msg_list); |
15b2f647 | 833 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); |
6f3d791f S |
834 | |
835 | if (channel->rescind) | |
836 | goto post_msg_err; | |
837 | ||
c0bb0392 VK |
838 | ret = vmbus_post_msg(msg, sizeof(struct vmbus_channel_gpadl_teardown), |
839 | true); | |
3e7ee490 | 840 | |
09cdf8f8 VK |
841 | trace_vmbus_teardown_gpadl(msg, ret); |
842 | ||
66be6530 S |
843 | if (ret) |
844 | goto post_msg_err; | |
845 | ||
846 | wait_for_completion(&info->waitevent); | |
3e7ee490 | 847 | |
66be6530 | 848 | post_msg_err: |
5e030d5c S |
849 | /* |
850 | * If the channel has been rescinded; | |
851 | * we will be awakened by the rescind | |
852 | * handler; set the error code to zero so we don't leak memory. | |
853 | */ | |
854 | if (channel->rescind) | |
855 | ret = 0; | |
856 | ||
15b2f647 | 857 | spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags); |
c50f7fb2 | 858 | list_del(&info->msglistentry); |
15b2f647 | 859 | spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags); |
3e7ee490 | 860 | |
8c69f52a | 861 | kfree(info); |
3e7ee490 HJ |
862 | return ret; |
863 | } | |
18726d7a | 864 | EXPORT_SYMBOL_GPL(vmbus_teardown_gpadl); |
3e7ee490 | 865 | |
d3b26dd7 | 866 | void vmbus_reset_channel_cb(struct vmbus_channel *channel) |
3e7ee490 | 867 | { |
9403b66e APM |
868 | unsigned long flags; |
869 | ||
63d55b2a | 870 | /* |
dad72a1d | 871 | * vmbus_on_event(), running in the per-channel tasklet, can race |
63d55b2a DC |
872 | * with vmbus_close_internal() in the case of SMP guest, e.g., when |
873 | * the former is accessing channel->inbound.ring_buffer, the latter | |
dad72a1d DC |
874 | * could be freeing the ring_buffer pages, so here we must stop it |
875 | * first. | |
ac504767 APM |
876 | * |
877 | * vmbus_chan_sched() might call the netvsc driver callback function | |
878 | * that ends up scheduling NAPI work that accesses the ring buffer. | |
879 | * At this point, we have to ensure that any such work is completed | |
880 | * and that the channel ring buffer is no longer being accessed, cf. | |
881 | * the calls to napi_disable() in netvsc_device_remove(). | |
63d55b2a | 882 | */ |
dad72a1d | 883 | tasklet_disable(&channel->callback_event); |
63d55b2a | 884 | |
9403b66e APM |
885 | /* See the inline comments in vmbus_chan_sched(). */ |
886 | spin_lock_irqsave(&channel->sched_lock, flags); | |
887 | channel->onchannel_callback = NULL; | |
888 | spin_unlock_irqrestore(&channel->sched_lock, flags); | |
d3b26dd7 | 889 | |
9403b66e | 890 | channel->sc_creation_callback = NULL; |
d3b26dd7 DC |
891 | |
892 | /* Re-enable tasklet for use on re-open */ | |
893 | tasklet_enable(&channel->callback_event); | |
894 | } | |
895 | ||
896 | static int vmbus_close_internal(struct vmbus_channel *channel) | |
897 | { | |
898 | struct vmbus_channel_close_channel *msg; | |
899 | int ret; | |
900 | ||
901 | vmbus_reset_channel_cb(channel); | |
902 | ||
64b7faf9 DC |
903 | /* |
904 | * In case a device driver's probe() fails (e.g., | |
905 | * util_probe() -> vmbus_open() returns -ENOMEM) and the device is | |
8a1115ff | 906 | * rescinded later (e.g., we dynamically disable an Integrated Service |
64b7faf9 DC |
907 | * in Hyper-V Manager), the driver's remove() invokes vmbus_close(): |
908 | * here we should skip most of the below cleanup work. | |
909 | */ | |
ae6935ed SH |
910 | if (channel->state != CHANNEL_OPENED_STATE) |
911 | return -EINVAL; | |
64b7faf9 | 912 | |
e68d2971 | 913 | channel->state = CHANNEL_OPEN_STATE; |
3e7ee490 | 914 | |
454f18a9 | 915 | /* Send a closing message */ |
3e7ee490 | 916 | |
e9a27a9f | 917 | msg = &channel->close_msg.msg; |
3e7ee490 | 918 | |
c50f7fb2 HZ |
919 | msg->header.msgtype = CHANNELMSG_CLOSECHANNEL; |
920 | msg->child_relid = channel->offermsg.child_relid; | |
3e7ee490 | 921 | |
c0bb0392 VK |
922 | ret = vmbus_post_msg(msg, sizeof(struct vmbus_channel_close_channel), |
923 | true); | |
3e7ee490 | 924 | |
633b005d VK |
925 | trace_vmbus_close_internal(msg, ret); |
926 | ||
98d731bb S |
927 | if (ret) { |
928 | pr_err("Close failed: close post msg return is %d\n", ret); | |
929 | /* | |
930 | * If we failed to post the close msg, | |
931 | * it is perhaps better to leak memory. | |
932 | */ | |
98d731bb S |
933 | } |
934 | ||
454f18a9 | 935 | /* Tear down the gpadl for the channel's ring buffer */ |
ae6935ed | 936 | else if (channel->ringbuffer_gpadlhandle) { |
98d731bb S |
937 | ret = vmbus_teardown_gpadl(channel, |
938 | channel->ringbuffer_gpadlhandle); | |
939 | if (ret) { | |
940 | pr_err("Close failed: teardown gpadl return %d\n", ret); | |
941 | /* | |
942 | * If we failed to teardown gpadl, | |
943 | * it is perhaps better to leak memory. | |
944 | */ | |
98d731bb | 945 | } |
3e7ee490 | 946 | |
ae6935ed SH |
947 | channel->ringbuffer_gpadlhandle = 0; |
948 | } | |
3e7ee490 | 949 | |
e8b7db38 AB |
950 | if (!ret) |
951 | vmbus_free_requestor(&channel->requestor); | |
952 | ||
98d731bb | 953 | return ret; |
3e7ee490 | 954 | } |
e68d2971 | 955 | |
ae6935ed SH |
956 | /* disconnect ring - close all channels */ |
957 | int vmbus_disconnect_ring(struct vmbus_channel *channel) | |
e68d2971 | 958 | { |
ae6935ed | 959 | struct vmbus_channel *cur_channel, *tmp; |
ae6935ed | 960 | int ret; |
e68d2971 | 961 | |
ae6935ed SH |
962 | if (channel->primary_channel != NULL) |
963 | return -EINVAL; | |
964 | ||
b5679ceb | 965 | list_for_each_entry_safe(cur_channel, tmp, &channel->sc_list, sc_list) { |
ae6935ed | 966 | if (cur_channel->rescind) |
7fa32e5e | 967 | wait_for_completion(&cur_channel->rescind_event); |
ae6935ed SH |
968 | |
969 | mutex_lock(&vmbus_connection.channel_mutex); | |
970 | if (vmbus_close_internal(cur_channel) == 0) { | |
971 | vmbus_free_ring(cur_channel); | |
972 | ||
973 | if (cur_channel->rescind) | |
974 | hv_process_channel_removal(cur_channel); | |
54a66265 | 975 | } |
7fa32e5e | 976 | mutex_unlock(&vmbus_connection.channel_mutex); |
e68d2971 | 977 | } |
ae6935ed | 978 | |
e68d2971 S |
979 | /* |
980 | * Now close the primary. | |
981 | */ | |
7fa32e5e | 982 | mutex_lock(&vmbus_connection.channel_mutex); |
ae6935ed | 983 | ret = vmbus_close_internal(channel); |
192b2d78 | 984 | mutex_unlock(&vmbus_connection.channel_mutex); |
ae6935ed SH |
985 | |
986 | return ret; | |
987 | } | |
988 | EXPORT_SYMBOL_GPL(vmbus_disconnect_ring); | |
989 | ||
/*
 * vmbus_close - Close the specified channel
 * @channel: channel to close
 *
 * Disconnects the ring and, only if that succeeded, frees the ring of
 * @channel.
 */
void vmbus_close(struct vmbus_channel *channel)
{
	if (vmbus_disconnect_ring(channel) != 0)
		return;

	vmbus_free_ring(channel);
}
EXPORT_SYMBOL_GPL(vmbus_close);
3e7ee490 | 999 | |
5dd0fb9b | 1000 | /** |
1001 | * vmbus_sendpacket() - Send the specified buffer on the given channel | |
fe857bb4 DC |
1002 | * @channel: Pointer to vmbus_channel structure |
1003 | * @buffer: Pointer to the buffer you want to send the data from. | |
1004 | * @bufferlen: Maximum size of what the buffer holds. | |
5dd0fb9b | 1005 | * @requestid: Identifier of the request |
fe857bb4 DC |
1006 | * @type: Type of packet that is being sent e.g. negotiate, time |
1007 | * packet etc. | |
1008 | * @flags: 0 or VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED | |
5dd0fb9b | 1009 | * |
fe857bb4 DC |
1010 | * Sends data in @buffer directly to Hyper-V via the vmbus. |
1011 | * This will send the data unparsed to Hyper-V. | |
5dd0fb9b | 1012 | * |
1013 | * Mainly used by Hyper-V drivers. | |
1014 | */ | |
1015 | int vmbus_sendpacket(struct vmbus_channel *channel, void *buffer, | |
1016 | u32 bufferlen, u64 requestid, | |
1017 | enum vmbus_packet_type type, u32 flags) | |
3e7ee490 | 1018 | { |
8dc0a06a | 1019 | struct vmpacket_descriptor desc; |
39d70a4a | 1020 | u32 packetlen = sizeof(struct vmpacket_descriptor) + bufferlen; |
73509681 | 1021 | u32 packetlen_aligned = ALIGN(packetlen, sizeof(u64)); |
011a7c3c | 1022 | struct kvec bufferlist[3]; |
39d70a4a | 1023 | u64 aligned_data = 0; |
b81658cf | 1024 | int num_vecs = ((bufferlen != 0) ? 3 : 1); |
3e7ee490 | 1025 | |
3e7ee490 | 1026 | |
454f18a9 | 1027 | /* Setup the descriptor */ |
415f2287 HZ |
1028 | desc.type = type; /* VmbusPacketTypeDataInBand; */ |
1029 | desc.flags = flags; /* VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED; */ | |
f4266e34 | 1030 | /* in 8-bytes granularity */ |
415f2287 HZ |
1031 | desc.offset8 = sizeof(struct vmpacket_descriptor) >> 3; |
1032 | desc.len8 = (u16)(packetlen_aligned >> 3); | |
e8b7db38 | 1033 | desc.trans_id = VMBUS_RQST_ERROR; /* will be updated in hv_ringbuffer_write() */ |
3e7ee490 | 1034 | |
011a7c3c S |
1035 | bufferlist[0].iov_base = &desc; |
1036 | bufferlist[0].iov_len = sizeof(struct vmpacket_descriptor); | |
1037 | bufferlist[1].iov_base = buffer; | |
1038 | bufferlist[1].iov_len = bufferlen; | |
1039 | bufferlist[2].iov_base = &aligned_data; | |
1040 | bufferlist[2].iov_len = (packetlen_aligned - packetlen); | |
3e7ee490 | 1041 | |
e8b7db38 | 1042 | return hv_ringbuffer_write(channel, bufferlist, num_vecs, requestid); |
3e7ee490 | 1043 | } |
fff41b2e | 1044 | EXPORT_SYMBOL(vmbus_sendpacket); |
3e7ee490 | 1045 | |
3e189519 | 1046 | /* |
5a668d8c | 1047 | * vmbus_sendpacket_pagebuffer - Send a range of single-page buffer |
87e93d61 S |
1048 | * packets using a GPADL Direct packet type. This interface allows you |
1049 | * to control notifying the host. This will be useful for sending | |
1050 | * batched data. Also the sender can control the send flags | |
1051 | * explicitly. | |
f4266e34 | 1052 | */ |
5a668d8c | 1053 | int vmbus_sendpacket_pagebuffer(struct vmbus_channel *channel, |
1054 | struct hv_page_buffer pagebuffers[], | |
1055 | u32 pagecount, void *buffer, u32 bufferlen, | |
1056 | u64 requestid) | |
3e7ee490 | 1057 | { |
f4266e34 | 1058 | int i; |
430a8e9a | 1059 | struct vmbus_channel_packet_page_buffer desc; |
39d70a4a HZ |
1060 | u32 descsize; |
1061 | u32 packetlen; | |
1062 | u32 packetlen_aligned; | |
011a7c3c | 1063 | struct kvec bufferlist[3]; |
39d70a4a | 1064 | u64 aligned_data = 0; |
3e7ee490 | 1065 | |
39d70a4a | 1066 | if (pagecount > MAX_PAGE_BUFFER_COUNT) |
002b53ea | 1067 | return -EINVAL; |
3e7ee490 | 1068 | |
f4266e34 | 1069 | /* |
430a8e9a | 1070 | * Adjust the size down since vmbus_channel_packet_page_buffer is the |
f4266e34 GKH |
1071 | * largest size we support |
1072 | */ | |
39d70a4a HZ |
1073 | descsize = sizeof(struct vmbus_channel_packet_page_buffer) - |
1074 | ((MAX_PAGE_BUFFER_COUNT - pagecount) * | |
f4266e34 | 1075 | sizeof(struct hv_page_buffer)); |
39d70a4a | 1076 | packetlen = descsize + bufferlen; |
73509681 | 1077 | packetlen_aligned = ALIGN(packetlen, sizeof(u64)); |
3e7ee490 | 1078 | |
454f18a9 | 1079 | /* Setup the descriptor */ |
415f2287 | 1080 | desc.type = VM_PKT_DATA_USING_GPA_DIRECT; |
5a668d8c | 1081 | desc.flags = VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED; |
bdc1dd47 | 1082 | desc.dataoffset8 = descsize >> 3; /* in 8-bytes granularity */ |
39d70a4a | 1083 | desc.length8 = (u16)(packetlen_aligned >> 3); |
e8b7db38 | 1084 | desc.transactionid = VMBUS_RQST_ERROR; /* will be updated in hv_ringbuffer_write() */ |
33d426a9 | 1085 | desc.reserved = 0; |
39d70a4a HZ |
1086 | desc.rangecount = pagecount; |
1087 | ||
1088 | for (i = 0; i < pagecount; i++) { | |
ca623ad3 HZ |
1089 | desc.range[i].len = pagebuffers[i].len; |
1090 | desc.range[i].offset = pagebuffers[i].offset; | |
1091 | desc.range[i].pfn = pagebuffers[i].pfn; | |
3e7ee490 HJ |
1092 | } |
1093 | ||
011a7c3c S |
1094 | bufferlist[0].iov_base = &desc; |
1095 | bufferlist[0].iov_len = descsize; | |
1096 | bufferlist[1].iov_base = buffer; | |
1097 | bufferlist[1].iov_len = bufferlen; | |
1098 | bufferlist[2].iov_base = &aligned_data; | |
1099 | bufferlist[2].iov_len = (packetlen_aligned - packetlen); | |
3e7ee490 | 1100 | |
e8b7db38 | 1101 | return hv_ringbuffer_write(channel, bufferlist, 3, requestid); |
3e7ee490 | 1102 | } |
713efeb4 | 1103 | EXPORT_SYMBOL_GPL(vmbus_sendpacket_pagebuffer); |
3e7ee490 | 1104 | |
d61031ee S |
1105 | /* |
1106 | * vmbus_sendpacket_multipagebuffer - Send a multi-page buffer packet | |
1107 | * using a GPADL Direct packet type. | |
1108 | * The buffer includes the vmbus descriptor. | |
1109 | */ | |
1110 | int vmbus_sendpacket_mpb_desc(struct vmbus_channel *channel, | |
1111 | struct vmbus_packet_mpb_array *desc, | |
1112 | u32 desc_size, | |
1113 | void *buffer, u32 bufferlen, u64 requestid) | |
1114 | { | |
d61031ee S |
1115 | u32 packetlen; |
1116 | u32 packetlen_aligned; | |
1117 | struct kvec bufferlist[3]; | |
1118 | u64 aligned_data = 0; | |
d61031ee S |
1119 | |
1120 | packetlen = desc_size + bufferlen; | |
1121 | packetlen_aligned = ALIGN(packetlen, sizeof(u64)); | |
1122 | ||
1123 | /* Setup the descriptor */ | |
1124 | desc->type = VM_PKT_DATA_USING_GPA_DIRECT; | |
1125 | desc->flags = VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED; | |
bdc1dd47 | 1126 | desc->dataoffset8 = desc_size >> 3; /* in 8-bytes granularity */ |
d61031ee | 1127 | desc->length8 = (u16)(packetlen_aligned >> 3); |
e8b7db38 | 1128 | desc->transactionid = VMBUS_RQST_ERROR; /* will be updated in hv_ringbuffer_write() */ |
33d426a9 | 1129 | desc->reserved = 0; |
d61031ee S |
1130 | desc->rangecount = 1; |
1131 | ||
1132 | bufferlist[0].iov_base = desc; | |
1133 | bufferlist[0].iov_len = desc_size; | |
1134 | bufferlist[1].iov_base = buffer; | |
1135 | bufferlist[1].iov_len = bufferlen; | |
1136 | bufferlist[2].iov_base = &aligned_data; | |
1137 | bufferlist[2].iov_len = (packetlen_aligned - packetlen); | |
1138 | ||
e8b7db38 | 1139 | return hv_ringbuffer_write(channel, bufferlist, 3, requestid); |
d61031ee S |
1140 | } |
1141 | EXPORT_SYMBOL_GPL(vmbus_sendpacket_mpb_desc); | |
1142 | ||
c88c4e4c | 1143 | /** |
fe857bb4 DC |
1144 | * __vmbus_recvpacket() - Retrieve the user packet on the specified channel |
1145 | * @channel: Pointer to vmbus_channel structure | |
39d70a4a | 1146 | * @buffer: Pointer to the buffer you want to receive the data into. |
fe857bb4 DC |
1147 | * @bufferlen: Maximum size of what the buffer can hold. |
1148 | * @buffer_actual_len: The actual size of the data after it was received. | |
39d70a4a | 1149 | * @requestid: Identifier of the request |
fe857bb4 | 1150 | * @raw: true means keep the vmpacket_descriptor header in the received data. |
c88c4e4c HJ |
1151 | * |
1152 | * Receives directly from the hyper-v vmbus and puts the data it received | |
1153 | * into Buffer. This will receive the data unparsed from hyper-v. | |
1154 | * | |
1155 | * Mainly used by Hyper-V drivers. | |
f4266e34 | 1156 | */ |
667d3740 VK |
1157 | static inline int |
1158 | __vmbus_recvpacket(struct vmbus_channel *channel, void *buffer, | |
1159 | u32 bufferlen, u32 *buffer_actual_len, u64 *requestid, | |
1160 | bool raw) | |
3e7ee490 | 1161 | { |
3372592a S |
1162 | return hv_ringbuffer_read(channel, buffer, bufferlen, |
1163 | buffer_actual_len, requestid, raw); | |
3e7ee490 | 1164 | |
667d3740 VK |
1165 | } |
1166 | ||
1167 | int vmbus_recvpacket(struct vmbus_channel *channel, void *buffer, | |
1168 | u32 bufferlen, u32 *buffer_actual_len, | |
1169 | u64 *requestid) | |
1170 | { | |
1171 | return __vmbus_recvpacket(channel, buffer, bufferlen, | |
1172 | buffer_actual_len, requestid, false); | |
3e7ee490 | 1173 | } |
fff41b2e | 1174 | EXPORT_SYMBOL(vmbus_recvpacket); |
3e7ee490 | 1175 | |
3e189519 | 1176 | /* |
fff41b2e | 1177 | * vmbus_recvpacket_raw - Retrieve the raw packet on the specified channel |
f4266e34 | 1178 | */ |
fff41b2e | 1179 | int vmbus_recvpacket_raw(struct vmbus_channel *channel, void *buffer, |
39d70a4a HZ |
1180 | u32 bufferlen, u32 *buffer_actual_len, |
1181 | u64 *requestid) | |
3e7ee490 | 1182 | { |
667d3740 VK |
1183 | return __vmbus_recvpacket(channel, buffer, bufferlen, |
1184 | buffer_actual_len, requestid, true); | |
3e7ee490 | 1185 | } |
adaee6bd | 1186 | EXPORT_SYMBOL_GPL(vmbus_recvpacket_raw); |
e8b7db38 AB |
1187 | |
1188 | /* | |
1189 | * vmbus_next_request_id - Returns a new request id. It is also | |
1190 | * the index at which the guest memory address is stored. | |
1191 | * Uses a spin lock to avoid race conditions. | |
1192 | * @rqstor: Pointer to the requestor struct | |
1193 | * @rqst_add: Guest memory address to be stored in the array | |
1194 | */ | |
1195 | u64 vmbus_next_request_id(struct vmbus_requestor *rqstor, u64 rqst_addr) | |
1196 | { | |
1197 | unsigned long flags; | |
1198 | u64 current_id; | |
1199 | const struct vmbus_channel *channel = | |
1200 | container_of(rqstor, const struct vmbus_channel, requestor); | |
1201 | ||
1202 | /* Check rqstor has been initialized */ | |
1203 | if (!channel->rqstor_size) | |
1204 | return VMBUS_NO_RQSTOR; | |
1205 | ||
1206 | spin_lock_irqsave(&rqstor->req_lock, flags); | |
1207 | current_id = rqstor->next_request_id; | |
1208 | ||
1209 | /* Requestor array is full */ | |
1210 | if (current_id >= rqstor->size) { | |
1211 | spin_unlock_irqrestore(&rqstor->req_lock, flags); | |
1212 | return VMBUS_RQST_ERROR; | |
1213 | } | |
1214 | ||
1215 | rqstor->next_request_id = rqstor->req_arr[current_id]; | |
1216 | rqstor->req_arr[current_id] = rqst_addr; | |
1217 | ||
1218 | /* The already held spin lock provides atomicity */ | |
1219 | bitmap_set(rqstor->req_bitmap, current_id, 1); | |
1220 | ||
1221 | spin_unlock_irqrestore(&rqstor->req_lock, flags); | |
1222 | ||
1223 | /* | |
1224 | * Cannot return an ID of 0, which is reserved for an unsolicited | |
1225 | * message from Hyper-V. | |
1226 | */ | |
1227 | return current_id + 1; | |
1228 | } | |
1229 | EXPORT_SYMBOL_GPL(vmbus_next_request_id); | |
1230 | ||
1231 | /* | |
1232 | * vmbus_request_addr - Returns the memory address stored at @trans_id | |
1233 | * in @rqstor. Uses a spin lock to avoid race conditions. | |
1234 | * @rqstor: Pointer to the requestor struct | |
1235 | * @trans_id: Request id sent back from Hyper-V. Becomes the requestor's | |
1236 | * next request id. | |
1237 | */ | |
1238 | u64 vmbus_request_addr(struct vmbus_requestor *rqstor, u64 trans_id) | |
1239 | { | |
1240 | unsigned long flags; | |
1241 | u64 req_addr; | |
1242 | const struct vmbus_channel *channel = | |
1243 | container_of(rqstor, const struct vmbus_channel, requestor); | |
1244 | ||
1245 | /* Check rqstor has been initialized */ | |
1246 | if (!channel->rqstor_size) | |
1247 | return VMBUS_NO_RQSTOR; | |
1248 | ||
1249 | /* Hyper-V can send an unsolicited message with ID of 0 */ | |
1250 | if (!trans_id) | |
1251 | return trans_id; | |
1252 | ||
1253 | spin_lock_irqsave(&rqstor->req_lock, flags); | |
1254 | ||
1255 | /* Data corresponding to trans_id is stored at trans_id - 1 */ | |
1256 | trans_id--; | |
1257 | ||
1258 | /* Invalid trans_id */ | |
1259 | if (trans_id >= rqstor->size || !test_bit(trans_id, rqstor->req_bitmap)) { | |
1260 | spin_unlock_irqrestore(&rqstor->req_lock, flags); | |
1261 | return VMBUS_RQST_ERROR; | |
1262 | } | |
1263 | ||
1264 | req_addr = rqstor->req_arr[trans_id]; | |
1265 | rqstor->req_arr[trans_id] = rqstor->next_request_id; | |
1266 | rqstor->next_request_id = trans_id; | |
1267 | ||
1268 | /* The already held spin lock provides atomicity */ | |
1269 | bitmap_clear(rqstor->req_bitmap, trans_id, 1); | |
1270 | ||
1271 | spin_unlock_irqrestore(&rqstor->req_lock, flags); | |
1272 | return req_addr; | |
1273 | } | |
1274 | EXPORT_SYMBOL_GPL(vmbus_request_addr); |