2 * Copyright (c) 2005 Topspin Communications. All rights reserved.
3 * Copyright (c) 2005 Cisco Systems. All rights reserved.
4 * Copyright (c) 2005 PathScale, Inc. All rights reserved.
6 * This software is available to you under a choice of one of two
7 * licenses. You may choose to be licensed under the terms of the GNU
8 * General Public License (GPL) Version 2, available from the file
9 * COPYING in the main directory of this source tree, or the
10 * OpenIB.org BSD license below:
12 * Redistribution and use in source and binary forms, with or
13 * without modification, are permitted provided that the following
16 * - Redistributions of source code must retain the above
17 * copyright notice, this list of conditions and the following
20 * - Redistributions in binary form must reproduce the above
21 * copyright notice, this list of conditions and the following
22 * disclaimer in the documentation and/or other materials
23 * provided with the distribution.
25 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
26 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
27 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
28 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
29 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
30 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
31 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34 * $Id: uverbs_cmd.c 2708 2005-06-24 17:27:21Z roland $
37 #include <linux/file.h>
39 #include <asm/uaccess.h>
/*
 * INIT_UDATA - fill in a udata descriptor.
 *
 * Stores ibuf/obuf (cast to __user pointers) in the inbuf/outbuf fields
 * and ilen/olen in the inlen/outlen fields of *udata.
 */
43 #define INIT_UDATA(udata, ibuf, obuf, ilen, olen) \
45 (udata)->inbuf = (void __user *) (ibuf); \
46 (udata)->outbuf = (void __user *) (obuf); \
47 (udata)->inlen = (ilen); \
48 (udata)->outlen = (olen); \
/*
 * ib_uverbs_get_context - create the device user context for a uverbs file.
 *
 * Reads the command from buf, has the device allocate a ucontext (the
 * bytes that follow the command and response structs are handed to the
 * driver through udata), initializes the context's per-object lists,
 * allocates the async event file, copies the response to the user
 * address in cmd.response, registers the async event handler and
 * installs the async fd.
 */
51 ssize_t ib_uverbs_get_context(struct ib_uverbs_file *file,
52 const char __user *buf,
53 int in_len, int out_len)
55 struct ib_uverbs_get_context cmd;
56 struct ib_uverbs_get_context_resp resp;
57 struct ib_udata udata;
58 struct ib_device *ibdev = file->device->ib_dev;
59 struct ib_ucontext *ucontext;
/* The response must fit in the caller-supplied output space. */
63 if (out_len < sizeof resp)
66 if (copy_from_user(&cmd, buf, sizeof cmd))
/* Driver-private input follows cmd; driver-private output follows resp. */
76 INIT_UDATA(&udata, buf + sizeof cmd,
77 (unsigned long) cmd.response + sizeof resp,
78 in_len - sizeof cmd, out_len - sizeof resp);
80 ucontext = ibdev->alloc_ucontext(ibdev, &udata);
/*
 * Report the error carried by the pointer alloc_ucontext() just
 * returned.  file->ucontext is only assigned further down, after setup
 * has succeeded, so it does not hold this error.
 */
82 return PTR_ERR(ucontext);
84 ucontext->device = ibdev;
/* One list per object type owned by this context. */
85 INIT_LIST_HEAD(&ucontext->pd_list);
86 INIT_LIST_HEAD(&ucontext->mr_list);
87 INIT_LIST_HEAD(&ucontext->mw_list);
88 INIT_LIST_HEAD(&ucontext->cq_list);
89 INIT_LIST_HEAD(&ucontext->qp_list);
90 INIT_LIST_HEAD(&ucontext->srq_list);
91 INIT_LIST_HEAD(&ucontext->ah_list);
93 resp.num_comp_vectors = file->device->num_comp_vectors;
/* Allocate the async event file; its fd number is returned in resp. */
95 filp = ib_uverbs_alloc_event_file(file, 1, &resp.async_fd);
101 if (copy_to_user((void __user *) (unsigned long) cmd.response,
102 &resp, sizeof resp)) {
107 file->async_file = filp->private_data;
109 INIT_IB_EVENT_HANDLER(&file->event_handler, file->device->ib_dev,
110 ib_uverbs_event_handler);
111 ret = ib_register_event_handler(&file->event_handler);
/* Take references on the async file and on the uverbs file itself. */
115 kref_get(&file->async_file->ref);
116 kref_get(&file->ref);
117 file->ucontext = ucontext;
/* Make the fd visible to userspace only after everything else is set up. */
119 fd_install(resp.async_fd, filp);
/* NOTE(review): the two calls below presumably belong to the error unwind path. */
126 put_unused_fd(resp.async_fd);
130 ibdev->dealloc_ucontext(ucontext);
/*
 * ib_uverbs_query_device - report device attributes to userspace.
 *
 * Reads the command from buf, queries the device with ib_query_device(),
 * copies the attributes field by field into a zeroed response struct and
 * copies that struct to the user address in cmd.response.
 */
137 ssize_t ib_uverbs_query_device(struct ib_uverbs_file *file,
138 const char __user *buf,
139 int in_len, int out_len)
141 struct ib_uverbs_query_device cmd;
142 struct ib_uverbs_query_device_resp resp;
143 struct ib_device_attr attr;
/* The response must fit in the caller-supplied output space. */
146 if (out_len < sizeof resp)
149 if (copy_from_user(&cmd, buf, sizeof cmd))
152 ret = ib_query_device(file->device->ib_dev, &attr);
/* Zero the whole response before filling it in field by field. */
156 memset(&resp, 0, sizeof resp);
158 resp.fw_ver = attr.fw_ver;
159 resp.node_guid = attr.node_guid;
160 resp.sys_image_guid = attr.sys_image_guid;
161 resp.max_mr_size = attr.max_mr_size;
162 resp.page_size_cap = attr.page_size_cap;
163 resp.vendor_id = attr.vendor_id;
164 resp.vendor_part_id = attr.vendor_part_id;
165 resp.hw_ver = attr.hw_ver;
166 resp.max_qp = attr.max_qp;
167 resp.max_qp_wr = attr.max_qp_wr;
168 resp.device_cap_flags = attr.device_cap_flags;
169 resp.max_sge = attr.max_sge;
170 resp.max_sge_rd = attr.max_sge_rd;
171 resp.max_cq = attr.max_cq;
172 resp.max_cqe = attr.max_cqe;
173 resp.max_mr = attr.max_mr;
174 resp.max_pd = attr.max_pd;
175 resp.max_qp_rd_atom = attr.max_qp_rd_atom;
176 resp.max_ee_rd_atom = attr.max_ee_rd_atom;
177 resp.max_res_rd_atom = attr.max_res_rd_atom;
178 resp.max_qp_init_rd_atom = attr.max_qp_init_rd_atom;
179 resp.max_ee_init_rd_atom = attr.max_ee_init_rd_atom;
180 resp.atomic_cap = attr.atomic_cap;
181 resp.max_ee = attr.max_ee;
182 resp.max_rdd = attr.max_rdd;
183 resp.max_mw = attr.max_mw;
184 resp.max_raw_ipv6_qp = attr.max_raw_ipv6_qp;
185 resp.max_raw_ethy_qp = attr.max_raw_ethy_qp;
186 resp.max_mcast_grp = attr.max_mcast_grp;
187 resp.max_mcast_qp_attach = attr.max_mcast_qp_attach;
188 resp.max_total_mcast_qp_attach = attr.max_total_mcast_qp_attach;
189 resp.max_ah = attr.max_ah;
190 resp.max_fmr = attr.max_fmr;
191 resp.max_map_per_fmr = attr.max_map_per_fmr;
192 resp.max_srq = attr.max_srq;
193 resp.max_srq_wr = attr.max_srq_wr;
194 resp.max_srq_sge = attr.max_srq_sge;
195 resp.max_pkeys = attr.max_pkeys;
196 resp.local_ca_ack_delay = attr.local_ca_ack_delay;
/* The port count is read from the ib_device itself, not from attr. */
197 resp.phys_port_cnt = file->device->ib_dev->phys_port_cnt;
199 if (copy_to_user((void __user *) (unsigned long) cmd.response,
/*
 * ib_uverbs_query_port - report the attributes of one port to userspace.
 *
 * Reads the command from buf, queries port cmd.port_num with
 * ib_query_port(), copies the attributes into a zeroed response struct
 * and copies that struct to the user address in cmd.response.
 */
206 ssize_t ib_uverbs_query_port(struct ib_uverbs_file *file,
207 const char __user *buf,
208 int in_len, int out_len)
210 struct ib_uverbs_query_port cmd;
211 struct ib_uverbs_query_port_resp resp;
212 struct ib_port_attr attr;
/* The response must fit in the caller-supplied output space. */
215 if (out_len < sizeof resp)
218 if (copy_from_user(&cmd, buf, sizeof cmd))
221 ret = ib_query_port(file->device->ib_dev, cmd.port_num, &attr);
/* Zero the whole response before filling it in field by field. */
225 memset(&resp, 0, sizeof resp);
227 resp.state = attr.state;
228 resp.max_mtu = attr.max_mtu;
229 resp.active_mtu = attr.active_mtu;
230 resp.gid_tbl_len = attr.gid_tbl_len;
231 resp.port_cap_flags = attr.port_cap_flags;
232 resp.max_msg_sz = attr.max_msg_sz;
233 resp.bad_pkey_cntr = attr.bad_pkey_cntr;
234 resp.qkey_viol_cntr = attr.qkey_viol_cntr;
235 resp.pkey_tbl_len = attr.pkey_tbl_len;
237 resp.sm_lid = attr.sm_lid;
239 resp.max_vl_num = attr.max_vl_num;
240 resp.sm_sl = attr.sm_sl;
241 resp.subnet_timeout = attr.subnet_timeout;
242 resp.init_type_reply = attr.init_type_reply;
243 resp.active_width = attr.active_width;
244 resp.active_speed = attr.active_speed;
245 resp.phys_state = attr.phys_state;
247 if (copy_to_user((void __user *) (unsigned long) cmd.response,
/*
 * ib_uverbs_alloc_pd - allocate a protection domain for this context.
 *
 * Reads the command from buf, allocates a tracking uobject, has the
 * device allocate the PD, stores the PD in ib_uverbs_pd_idr under
 * ib_uverbs_idr_mutex, returns the new id to userspace as
 * resp.pd_handle and links the uobject on the context's pd_list.
 */
254 ssize_t ib_uverbs_alloc_pd(struct ib_uverbs_file *file,
255 const char __user *buf,
256 int in_len, int out_len)
258 struct ib_uverbs_alloc_pd cmd;
259 struct ib_uverbs_alloc_pd_resp resp;
260 struct ib_udata udata;
261 struct ib_uobject *uobj;
/* The response must fit in the caller-supplied output space. */
265 if (out_len < sizeof resp)
268 if (copy_from_user(&cmd, buf, sizeof cmd))
/* Driver-private input follows cmd; driver-private output follows resp. */
271 INIT_UDATA(&udata, buf + sizeof cmd,
272 (unsigned long) cmd.response + sizeof resp,
273 in_len - sizeof cmd, out_len - sizeof resp);
275 uobj = kmalloc(sizeof *uobj, GFP_KERNEL);
279 uobj->context = file->ucontext;
281 pd = file->device->ib_dev->alloc_pd(file->device->ib_dev,
282 file->ucontext, &udata);
288 pd->device = file->device->ib_dev;
290 atomic_set(&pd->usecnt, 0);
/* The handle tables are modified with ib_uverbs_idr_mutex held. */
292 down(&ib_uverbs_idr_mutex);
295 if (!idr_pre_get(&ib_uverbs_pd_idr, GFP_KERNEL)) {
300 ret = idr_get_new(&ib_uverbs_pd_idr, pd, &uobj->id);
307 memset(&resp, 0, sizeof resp);
/* The idr id doubles as the handle userspace uses to name this PD. */
308 resp.pd_handle = uobj->id;
310 if (copy_to_user((void __user *) (unsigned long) cmd.response,
311 &resp, sizeof resp)) {
317 list_add_tail(&uobj->list, &file->ucontext->pd_list);
320 up(&ib_uverbs_idr_mutex);
/* NOTE(review): the lines below presumably belong to the error unwind path. */
325 idr_remove(&ib_uverbs_pd_idr, uobj->id);
328 up(&ib_uverbs_idr_mutex);
/*
 * ib_uverbs_dealloc_pd - free a protection domain named by handle.
 *
 * Looks up cmd.pd_handle in ib_uverbs_pd_idr under ib_uverbs_idr_mutex,
 * deallocates the PD with ib_dealloc_pd(), then drops the idr entry and
 * unlinks the tracking uobject.  Returns ret when it is non-zero,
 * otherwise in_len.
 */
336 ssize_t ib_uverbs_dealloc_pd(struct ib_uverbs_file *file,
337 const char __user *buf,
338 int in_len, int out_len)
340 struct ib_uverbs_dealloc_pd cmd;
342 struct ib_uobject *uobj;
345 if (copy_from_user(&cmd, buf, sizeof cmd))
348 down(&ib_uverbs_idr_mutex);
350 pd = idr_find(&ib_uverbs_pd_idr, cmd.pd_handle);
/* The handle must exist and belong to the calling file's context. */
351 if (!pd || pd->uobject->context != file->ucontext)
356 ret = ib_dealloc_pd(pd);
360 idr_remove(&ib_uverbs_pd_idr, cmd.pd_handle);
363 list_del(&uobj->list);
369 up(&ib_uverbs_idr_mutex);
371 return ret ? ret : in_len;
/*
 * ib_uverbs_reg_mr - register a user memory region.
 *
 * Reads the command from buf, validates the address alignment and access
 * flags, pins the user memory with ib_umem_get(), looks up the PD named
 * by cmd.pd_handle, has the device register the region, stores the MR in
 * ib_uverbs_mr_idr, returns lkey/rkey/mr_handle in the response and
 * links the object on the context's mr_list.
 */
374 ssize_t ib_uverbs_reg_mr(struct ib_uverbs_file *file,
375 const char __user *buf, int in_len,
378 struct ib_uverbs_reg_mr cmd;
379 struct ib_uverbs_reg_mr_resp resp;
380 struct ib_udata udata;
381 struct ib_umem_object *obj;
/* The response must fit in the caller-supplied output space. */
386 if (out_len < sizeof resp)
389 if (copy_from_user(&cmd, buf, sizeof cmd))
/* Driver-private input follows cmd; driver-private output follows resp. */
392 INIT_UDATA(&udata, buf + sizeof cmd,
393 (unsigned long) cmd.response + sizeof resp,
394 in_len - sizeof cmd, out_len - sizeof resp);
/* The user address and the HCA address must share the same in-page offset. */
396 if ((cmd.start & ~PAGE_MASK) != (cmd.hca_va & ~PAGE_MASK))
400 * Local write permission is required if remote write or
401 * remote atomic permission is also requested.
403 if (cmd.access_flags & (IB_ACCESS_REMOTE_ATOMIC | IB_ACCESS_REMOTE_WRITE) &&
404 !(cmd.access_flags & IB_ACCESS_LOCAL_WRITE))
407 obj = kmalloc(sizeof *obj, GFP_KERNEL);
411 obj->uobject.context = file->ucontext;
414 * We ask for writable memory if any access flags other than
415 * "remote read" are set. "Local write" and "remote write"
416 * obviously require write access. "Remote atomic" can do
417 * things like fetch and add, which will modify memory, and
418 * "MW bind" can change permissions by binding a window.
420 ret = ib_umem_get(file->device->ib_dev, &obj->umem,
421 (void *) (unsigned long) cmd.start, cmd.length,
422 !!(cmd.access_flags & ~IB_ACCESS_REMOTE_READ));
426 obj->umem.virt_base = cmd.hca_va;
428 down(&ib_uverbs_idr_mutex);
430 pd = idr_find(&ib_uverbs_pd_idr, cmd.pd_handle);
/* The PD handle must exist and belong to the calling file's context. */
431 if (!pd || pd->uobject->context != file->ucontext) {
/* Not every device provides a reg_user_mr method. */
436 if (!pd->device->reg_user_mr) {
441 mr = pd->device->reg_user_mr(pd, &obj->umem, cmd.access_flags, &udata);
447 mr->device = pd->device;
449 mr->uobject = &obj->uobject;
/* The new MR holds a use count on its PD. */
450 atomic_inc(&pd->usecnt);
451 atomic_set(&mr->usecnt, 0);
453 memset(&resp, 0, sizeof resp);
454 resp.lkey = mr->lkey;
455 resp.rkey = mr->rkey;
458 if (!idr_pre_get(&ib_uverbs_mr_idr, GFP_KERNEL)) {
463 ret = idr_get_new(&ib_uverbs_mr_idr, mr, &obj->uobject.id);
470 resp.mr_handle = obj->uobject.id;
472 if (copy_to_user((void __user *) (unsigned long) cmd.response,
473 &resp, sizeof resp)) {
479 list_add_tail(&obj->uobject.list, &file->ucontext->mr_list);
482 up(&ib_uverbs_idr_mutex);
/* NOTE(review): the lines below presumably belong to the error unwind path. */
487 idr_remove(&ib_uverbs_mr_idr, obj->uobject.id);
493 up(&ib_uverbs_idr_mutex);
495 ib_umem_release(file->device->ib_dev, &obj->umem);
/*
 * ib_uverbs_dereg_mr - deregister a memory region named by handle.
 *
 * Looks up cmd.mr_handle in ib_uverbs_mr_idr under ib_uverbs_idr_mutex,
 * deregisters the MR with ib_dereg_mr(), then drops the idr entry,
 * unlinks the tracking object and releases the pinned user memory.
 * Returns ret when it is non-zero, otherwise in_len.
 */
502 ssize_t ib_uverbs_dereg_mr(struct ib_uverbs_file *file,
503 const char __user *buf, int in_len,
506 struct ib_uverbs_dereg_mr cmd;
508 struct ib_umem_object *memobj;
511 if (copy_from_user(&cmd, buf, sizeof cmd))
514 down(&ib_uverbs_idr_mutex);
516 mr = idr_find(&ib_uverbs_mr_idr, cmd.mr_handle);
/* The handle must exist and belong to the calling file's context. */
517 if (!mr || mr->uobject->context != file->ucontext)
/* The uobject is embedded in the ib_umem_object that tracks the pinned memory. */
520 memobj = container_of(mr->uobject, struct ib_umem_object, uobject);
522 ret = ib_dereg_mr(mr);
526 idr_remove(&ib_uverbs_mr_idr, cmd.mr_handle);
529 list_del(&memobj->uobject.list);
532 ib_umem_release(file->device->ib_dev, &memobj->umem);
536 up(&ib_uverbs_idr_mutex);
538 return ret ? ret : in_len;
/*
 * ib_uverbs_create_comp_channel - create a completion event channel.
 *
 * Reads the command from buf, allocates an event file with
 * ib_uverbs_alloc_event_file() (second argument 0, where get_context
 * passes 1 for the async file), copies the response carrying the new fd
 * number to cmd.response and installs the fd.
 */
541 ssize_t ib_uverbs_create_comp_channel(struct ib_uverbs_file *file,
542 const char __user *buf, int in_len,
545 struct ib_uverbs_create_comp_channel cmd;
546 struct ib_uverbs_create_comp_channel_resp resp;
/* The response must fit in the caller-supplied output space. */
549 if (out_len < sizeof resp)
552 if (copy_from_user(&cmd, buf, sizeof cmd))
555 filp = ib_uverbs_alloc_event_file(file, 0, &resp.fd);
557 return PTR_ERR(filp);
559 if (copy_to_user((void __user *) (unsigned long) cmd.response,
560 &resp, sizeof resp)) {
/* Userspace never learned the fd number, so give the reserved fd back. */
561 put_unused_fd(resp.fd);
/* Make the fd visible to userspace only once the response has been delivered. */
566 fd_install(resp.fd, filp);
/*
 * ib_uverbs_create_cq - create a completion queue.
 *
 * Reads the command from buf, checks the requested completion vector,
 * optionally looks up the completion event file named by
 * cmd.comp_channel, has the device create the CQ, stores it in
 * ib_uverbs_cq_idr, returns the id as resp.cq_handle and links the
 * object on the context's cq_list.
 */
570 ssize_t ib_uverbs_create_cq(struct ib_uverbs_file *file,
571 const char __user *buf, int in_len,
574 struct ib_uverbs_create_cq cmd;
575 struct ib_uverbs_create_cq_resp resp;
576 struct ib_udata udata;
577 struct ib_ucq_object *uobj;
578 struct ib_uverbs_event_file *ev_file = NULL;
/* The response must fit in the caller-supplied output space. */
582 if (out_len < sizeof resp)
585 if (copy_from_user(&cmd, buf, sizeof cmd))
/* Driver-private input follows cmd; driver-private output follows resp. */
588 INIT_UDATA(&udata, buf + sizeof cmd,
589 (unsigned long) cmd.response + sizeof resp,
590 in_len - sizeof cmd, out_len - sizeof resp);
592 if (cmd.comp_vector >= file->device->num_comp_vectors)
/* A negative comp_channel leaves ev_file NULL (no completion channel). */
595 if (cmd.comp_channel >= 0)
596 ev_file = ib_uverbs_lookup_comp_file(cmd.comp_channel);
598 uobj = kmalloc(sizeof *uobj, GFP_KERNEL);
602 uobj->uobject.user_handle = cmd.user_handle;
603 uobj->uobject.context = file->ucontext;
604 uobj->comp_events_reported = 0;
605 uobj->async_events_reported = 0;
606 INIT_LIST_HEAD(&uobj->comp_list);
607 INIT_LIST_HEAD(&uobj->async_list);
609 cq = file->device->ib_dev->create_cq(file->device->ib_dev, cmd.cqe,
610 file->ucontext, &udata);
616 cq->device = file->device->ib_dev;
617 cq->uobject = &uobj->uobject;
618 cq->comp_handler = ib_uverbs_comp_handler;
619 cq->event_handler = ib_uverbs_cq_event_handler;
/* The event file (possibly NULL) is stored as the CQ's context. */
620 cq->cq_context = ev_file;
621 atomic_set(&cq->usecnt, 0);
623 down(&ib_uverbs_idr_mutex);
626 if (!idr_pre_get(&ib_uverbs_cq_idr, GFP_KERNEL)) {
631 ret = idr_get_new(&ib_uverbs_cq_idr, cq, &uobj->uobject.id);
638 memset(&resp, 0, sizeof resp);
639 resp.cq_handle = uobj->uobject.id;
642 if (copy_to_user((void __user *) (unsigned long) cmd.response,
643 &resp, sizeof resp)) {
649 list_add_tail(&uobj->uobject.list, &file->ucontext->cq_list);
652 up(&ib_uverbs_idr_mutex);
/* NOTE(review): the lines below presumably belong to the error unwind path. */
657 idr_remove(&ib_uverbs_cq_idr, uobj->uobject.id);
660 up(&ib_uverbs_idr_mutex);
/*
 * ib_uverbs_poll_cq - poll a completion queue on behalf of userspace.
 *
 * Reads the command from buf, allocates room for cmd.ne work completions
 * plus a response buffer of matching size, polls the CQ named by
 * cmd.cq_handle, converts each returned completion into the user-visible
 * layout and copies the response buffer to cmd.response.  Returns ret
 * when it is non-zero, otherwise in_len.
 */
668 ssize_t ib_uverbs_poll_cq(struct ib_uverbs_file *file,
669 const char __user *buf, int in_len,
672 struct ib_uverbs_poll_cq cmd;
673 struct ib_uverbs_poll_cq_resp *resp;
680 if (copy_from_user(&cmd, buf, sizeof cmd))
/*
 * NOTE(review): cmd.ne comes straight from userspace and no bound or
 * overflow check on cmd.ne * sizeof ... is visible here - confirm one
 * exists, or add one.
 */
683 wc = kmalloc(cmd.ne * sizeof *wc, GFP_KERNEL);
687 rsize = sizeof *resp + cmd.ne * sizeof(struct ib_uverbs_wc);
688 resp = kmalloc(rsize, GFP_KERNEL);
694 down(&ib_uverbs_idr_mutex);
695 cq = idr_find(&ib_uverbs_cq_idr, cmd.cq_handle);
/* The handle must exist and belong to the calling file's context. */
696 if (!cq || cq->uobject->context != file->ucontext) {
701 resp->count = ib_poll_cq(cq, cmd.ne, wc);
/* Convert each polled completion to the layout exported to userspace. */
703 for (i = 0; i < resp->count; i++) {
704 resp->wc[i].wr_id = wc[i].wr_id;
705 resp->wc[i].status = wc[i].status;
706 resp->wc[i].opcode = wc[i].opcode;
707 resp->wc[i].vendor_err = wc[i].vendor_err;
708 resp->wc[i].byte_len = wc[i].byte_len;
709 resp->wc[i].imm_data = wc[i].imm_data;
710 resp->wc[i].qp_num = wc[i].qp_num;
711 resp->wc[i].src_qp = wc[i].src_qp;
712 resp->wc[i].wc_flags = wc[i].wc_flags;
713 resp->wc[i].pkey_index = wc[i].pkey_index;
714 resp->wc[i].slid = wc[i].slid;
715 resp->wc[i].sl = wc[i].sl;
716 resp->wc[i].dlid_path_bits = wc[i].dlid_path_bits;
717 resp->wc[i].port_num = wc[i].port_num;
/*
 * NOTE(review): resp comes from kmalloc() and only the first count
 * entries are filled in above, yet all rsize bytes are copied out.
 * Unless the buffer is cleared on a line not shown here, this hands
 * uninitialized kernel memory to userspace - confirm.
 */
720 if (copy_to_user((void __user *) (unsigned long) cmd.response, resp, rsize))
724 up(&ib_uverbs_idr_mutex);
729 return ret ? ret : in_len;
/*
 * ib_uverbs_req_notify_cq - arm a completion queue for notification.
 *
 * Reads the command from buf and, if cmd.cq_handle names a CQ owned by
 * the calling file's context, calls ib_req_notify_cq() on it.
 */
732 ssize_t ib_uverbs_req_notify_cq(struct ib_uverbs_file *file,
733 const char __user *buf, int in_len,
736 struct ib_uverbs_req_notify_cq cmd;
740 if (copy_from_user(&cmd, buf, sizeof cmd))
743 down(&ib_uverbs_idr_mutex);
744 cq = idr_find(&ib_uverbs_cq_idr, cmd.cq_handle);
745 if (cq && cq->uobject->context == file->ucontext) {
/* solicited_only selects IB_CQ_SOLICITED, otherwise IB_CQ_NEXT_COMP. */
746 ib_req_notify_cq(cq, cmd.solicited_only ?
747 IB_CQ_SOLICITED : IB_CQ_NEXT_COMP);
750 up(&ib_uverbs_idr_mutex);
/*
 * ib_uverbs_destroy_cq - destroy a completion queue named by handle.
 *
 * Looks up cmd.cq_handle under ib_uverbs_idr_mutex, destroys the CQ with
 * ib_destroy_cq(), drops the idr entry and unlinks the tracking object,
 * removes events still queued for this CQ from the completion and async
 * event files, and reports the per-CQ event counts in the response.
 * Returns ret when it is non-zero, otherwise in_len.
 */
755 ssize_t ib_uverbs_destroy_cq(struct ib_uverbs_file *file,
756 const char __user *buf, int in_len,
759 struct ib_uverbs_destroy_cq cmd;
760 struct ib_uverbs_destroy_cq_resp resp;
762 struct ib_ucq_object *uobj;
763 struct ib_uverbs_event_file *ev_file;
764 struct ib_uverbs_event *evt, *tmp;
768 if (copy_from_user(&cmd, buf, sizeof cmd))
771 memset(&resp, 0, sizeof resp);
773 down(&ib_uverbs_idr_mutex);
775 cq = idr_find(&ib_uverbs_cq_idr, cmd.cq_handle);
/* The handle must exist and belong to the calling file's context. */
776 if (!cq || cq->uobject->context != file->ucontext)
/* Read everything needed from the CQ before ib_destroy_cq() is called on it. */
779 user_handle = cq->uobject->user_handle;
780 uobj = container_of(cq->uobject, struct ib_ucq_object, uobject);
781 ev_file = cq->cq_context;
783 ret = ib_destroy_cq(cq);
787 idr_remove(&ib_uverbs_cq_idr, cmd.cq_handle);
790 list_del(&uobj->uobject.list);
/* Unqueue completion events still pending for this CQ on its event file. */
794 spin_lock_irq(&ev_file->lock);
795 list_for_each_entry_safe(evt, tmp, &uobj->comp_list, obj_list) {
796 list_del(&evt->list);
799 spin_unlock_irq(&ev_file->lock);
801 kref_put(&ev_file->ref, ib_uverbs_release_event_file);
/* Likewise for async events pending on the file's async event file. */
804 spin_lock_irq(&file->async_file->lock);
805 list_for_each_entry_safe(evt, tmp, &uobj->async_list, obj_list) {
806 list_del(&evt->list);
809 spin_unlock_irq(&file->async_file->lock);
811 resp.comp_events_reported = uobj->comp_events_reported;
812 resp.async_events_reported = uobj->async_events_reported;
816 if (copy_to_user((void __user *) (unsigned long) cmd.response,
821 up(&ib_uverbs_idr_mutex);
823 return ret ? ret : in_len;
/*
 * ib_uverbs_create_qp - create a queue pair.
 *
 * Reads the command from buf, resolves the PD, send CQ, receive CQ and
 * (when cmd.is_srq is set) SRQ handles, builds the init attributes from
 * the command, has the device create the QP, stores it in
 * ib_uverbs_qp_idr, returns qpn and qp_handle in the response and links
 * the object on the context's qp_list.
 */
826 ssize_t ib_uverbs_create_qp(struct ib_uverbs_file *file,
827 const char __user *buf, int in_len,
830 struct ib_uverbs_create_qp cmd;
831 struct ib_uverbs_create_qp_resp resp;
832 struct ib_udata udata;
833 struct ib_uevent_object *uobj;
835 struct ib_cq *scq, *rcq;
838 struct ib_qp_init_attr attr;
/* The response must fit in the caller-supplied output space. */
841 if (out_len < sizeof resp)
844 if (copy_from_user(&cmd, buf, sizeof cmd))
/* Driver-private input follows cmd; driver-private output follows resp. */
847 INIT_UDATA(&udata, buf + sizeof cmd,
848 (unsigned long) cmd.response + sizeof resp,
849 in_len - sizeof cmd, out_len - sizeof resp);
851 uobj = kmalloc(sizeof *uobj, GFP_KERNEL);
855 down(&ib_uverbs_idr_mutex);
857 pd = idr_find(&ib_uverbs_pd_idr, cmd.pd_handle);
858 scq = idr_find(&ib_uverbs_cq_idr, cmd.send_cq_handle);
859 rcq = idr_find(&ib_uverbs_cq_idr, cmd.recv_cq_handle);
860 srq = cmd.is_srq ? idr_find(&ib_uverbs_srq_idr, cmd.srq_handle) : NULL;
/* Every referenced object must exist and belong to the caller's context. */
862 if (!pd || pd->uobject->context != file->ucontext ||
863 !scq || scq->uobject->context != file->ucontext ||
864 !rcq || rcq->uobject->context != file->ucontext ||
865 (cmd.is_srq && (!srq || srq->uobject->context != file->ucontext))) {
870 attr.event_handler = ib_uverbs_qp_event_handler;
871 attr.qp_context = file;
875 attr.sq_sig_type = cmd.sq_sig_all ? IB_SIGNAL_ALL_WR : IB_SIGNAL_REQ_WR;
876 attr.qp_type = cmd.qp_type;
878 attr.cap.max_send_wr = cmd.max_send_wr;
879 attr.cap.max_recv_wr = cmd.max_recv_wr;
880 attr.cap.max_send_sge = cmd.max_send_sge;
881 attr.cap.max_recv_sge = cmd.max_recv_sge;
882 attr.cap.max_inline_data = cmd.max_inline_data;
884 uobj->uobject.user_handle = cmd.user_handle;
885 uobj->uobject.context = file->ucontext;
886 uobj->events_reported = 0;
887 INIT_LIST_HEAD(&uobj->event_list);
889 qp = pd->device->create_qp(pd, &attr, &udata);
/* Fill in the generic QP fields from the init attributes. */
895 qp->device = pd->device;
897 qp->send_cq = attr.send_cq;
898 qp->recv_cq = attr.recv_cq;
900 qp->uobject = &uobj->uobject;
901 qp->event_handler = attr.event_handler;
902 qp->qp_context = attr.qp_context;
903 qp->qp_type = attr.qp_type;
/* The QP holds a use count on each object it references. */
904 atomic_inc(&pd->usecnt);
905 atomic_inc(&attr.send_cq->usecnt);
906 atomic_inc(&attr.recv_cq->usecnt);
908 atomic_inc(&attr.srq->usecnt);
910 memset(&resp, 0, sizeof resp);
911 resp.qpn = qp->qp_num;
914 if (!idr_pre_get(&ib_uverbs_qp_idr, GFP_KERNEL)) {
919 ret = idr_get_new(&ib_uverbs_qp_idr, qp, &uobj->uobject.id);
926 resp.qp_handle = uobj->uobject.id;
928 if (copy_to_user((void __user *) (unsigned long) cmd.response,
929 &resp, sizeof resp)) {
935 list_add_tail(&uobj->uobject.list, &file->ucontext->qp_list);
938 up(&ib_uverbs_idr_mutex);
/* NOTE(review): the lines below presumably belong to the error unwind path. */
943 idr_remove(&ib_uverbs_qp_idr, uobj->uobject.id);
949 up(&ib_uverbs_idr_mutex);
/*
 * ib_uverbs_modify_qp - modify the attributes of a queue pair.
 *
 * Reads the command from buf, looks up the QP named by cmd.qp_handle
 * under ib_uverbs_idr_mutex, translates the command into an ib_qp_attr
 * (including the primary and alternate address vectors) and applies the
 * fields selected by cmd.attr_mask with ib_modify_qp().
 */
955 ssize_t ib_uverbs_modify_qp(struct ib_uverbs_file *file,
956 const char __user *buf, int in_len,
959 struct ib_uverbs_modify_qp cmd;
961 struct ib_qp_attr *attr;
964 if (copy_from_user(&cmd, buf, sizeof cmd))
/* The attribute struct is heap-allocated rather than placed on the stack. */
967 attr = kmalloc(sizeof *attr, GFP_KERNEL);
971 down(&ib_uverbs_idr_mutex);
973 qp = idr_find(&ib_uverbs_qp_idr, cmd.qp_handle);
/* The handle must exist and belong to the calling file's context. */
974 if (!qp || qp->uobject->context != file->ucontext) {
979 attr->qp_state = cmd.qp_state;
980 attr->cur_qp_state = cmd.cur_qp_state;
981 attr->path_mtu = cmd.path_mtu;
982 attr->path_mig_state = cmd.path_mig_state;
983 attr->qkey = cmd.qkey;
984 attr->rq_psn = cmd.rq_psn;
985 attr->sq_psn = cmd.sq_psn;
986 attr->dest_qp_num = cmd.dest_qp_num;
987 attr->qp_access_flags = cmd.qp_access_flags;
988 attr->pkey_index = cmd.pkey_index;
/* The alternate path takes its own P_Key index from the command. */
989 attr->alt_pkey_index = cmd.alt_pkey_index;
990 attr->en_sqd_async_notify = cmd.en_sqd_async_notify;
991 attr->max_rd_atomic = cmd.max_rd_atomic;
992 attr->max_dest_rd_atomic = cmd.max_dest_rd_atomic;
993 attr->min_rnr_timer = cmd.min_rnr_timer;
994 attr->port_num = cmd.port_num;
995 attr->timeout = cmd.timeout;
996 attr->retry_cnt = cmd.retry_cnt;
997 attr->rnr_retry = cmd.rnr_retry;
998 attr->alt_port_num = cmd.alt_port_num;
999 attr->alt_timeout = cmd.alt_timeout;
/* Primary path address vector, taken from cmd.dest. */
1001 memcpy(attr->ah_attr.grh.dgid.raw, cmd.dest.dgid, 16);
1002 attr->ah_attr.grh.flow_label = cmd.dest.flow_label;
1003 attr->ah_attr.grh.sgid_index = cmd.dest.sgid_index;
1004 attr->ah_attr.grh.hop_limit = cmd.dest.hop_limit;
1005 attr->ah_attr.grh.traffic_class = cmd.dest.traffic_class;
1006 attr->ah_attr.dlid = cmd.dest.dlid;
1007 attr->ah_attr.sl = cmd.dest.sl;
1008 attr->ah_attr.src_path_bits = cmd.dest.src_path_bits;
1009 attr->ah_attr.static_rate = cmd.dest.static_rate;
1010 attr->ah_attr.ah_flags = cmd.dest.is_global ? IB_AH_GRH : 0;
1011 attr->ah_attr.port_num = cmd.dest.port_num;
/* Alternate path address vector, taken from cmd.alt_dest. */
1013 memcpy(attr->alt_ah_attr.grh.dgid.raw, cmd.alt_dest.dgid, 16);
1014 attr->alt_ah_attr.grh.flow_label = cmd.alt_dest.flow_label;
1015 attr->alt_ah_attr.grh.sgid_index = cmd.alt_dest.sgid_index;
1016 attr->alt_ah_attr.grh.hop_limit = cmd.alt_dest.hop_limit;
1017 attr->alt_ah_attr.grh.traffic_class = cmd.alt_dest.traffic_class;
1018 attr->alt_ah_attr.dlid = cmd.alt_dest.dlid;
1019 attr->alt_ah_attr.sl = cmd.alt_dest.sl;
1020 attr->alt_ah_attr.src_path_bits = cmd.alt_dest.src_path_bits;
1021 attr->alt_ah_attr.static_rate = cmd.alt_dest.static_rate;
1022 attr->alt_ah_attr.ah_flags = cmd.alt_dest.is_global ? IB_AH_GRH : 0;
1023 attr->alt_ah_attr.port_num = cmd.alt_dest.port_num;
/* cmd.attr_mask is passed through as the attribute mask. */
1025 ret = ib_modify_qp(qp, attr, cmd.attr_mask);
1032 up(&ib_uverbs_idr_mutex);
/*
 * ib_uverbs_destroy_qp - destroy a queue pair named by handle.
 *
 * Looks up cmd.qp_handle under ib_uverbs_idr_mutex, destroys the QP with
 * ib_destroy_qp(), drops the idr entry and unlinks the tracking object,
 * removes async events still queued for this QP and reports
 * events_reported in the response.  Returns ret when it is non-zero,
 * otherwise in_len.
 */
1038 ssize_t ib_uverbs_destroy_qp(struct ib_uverbs_file *file,
1039 const char __user *buf, int in_len,
1042 struct ib_uverbs_destroy_qp cmd;
1043 struct ib_uverbs_destroy_qp_resp resp;
1045 struct ib_uevent_object *uobj;
1046 struct ib_uverbs_event *evt, *tmp;
1049 if (copy_from_user(&cmd, buf, sizeof cmd))
1052 memset(&resp, 0, sizeof resp);
1054 down(&ib_uverbs_idr_mutex);
1056 qp = idr_find(&ib_uverbs_qp_idr, cmd.qp_handle);
/* The handle must exist and belong to the calling file's context. */
1057 if (!qp || qp->uobject->context != file->ucontext)
1060 uobj = container_of(qp->uobject, struct ib_uevent_object, uobject);
1062 ret = ib_destroy_qp(qp);
1066 idr_remove(&ib_uverbs_qp_idr, cmd.qp_handle);
1069 list_del(&uobj->uobject.list);
/* Unqueue async events still pending for this QP. */
1072 spin_lock_irq(&file->async_file->lock);
1073 list_for_each_entry_safe(evt, tmp, &uobj->event_list, obj_list) {
1074 list_del(&evt->list);
1077 spin_unlock_irq(&file->async_file->lock);
1079 resp.events_reported = uobj->events_reported;
1083 if (copy_to_user((void __user *) (unsigned long) cmd.response,
1084 &resp, sizeof resp))
1088 up(&ib_uverbs_idr_mutex);
1090 return ret ? ret : in_len;
/*
 * ib_uverbs_post_send - post a chain of send work requests to a QP.
 *
 * The user buffer holds the command, then cmd.wr_count work requests of
 * cmd.wqe_size bytes each, then the scatter/gather entries for all of
 * them.  Each user work request is copied in and converted into a kernel
 * ib_send_wr whose sg list is stored directly after the struct in the
 * same allocation.  The chain is handed to the device's post_send method
 * and the response is copied to cmd.response.  Returns ret when it is
 * non-zero, otherwise in_len.
 */
1093 ssize_t ib_uverbs_post_send(struct ib_uverbs_file *file,
1094 const char __user *buf, int in_len,
1097 struct ib_uverbs_post_send cmd;
1098 struct ib_uverbs_post_send_resp resp;
1099 struct ib_uverbs_send_wr *user_wr;
1100 struct ib_send_wr *wr = NULL, *last, *next, *bad_wr;
1103 ssize_t ret = -EINVAL;
1105 if (copy_from_user(&cmd, buf, sizeof cmd))
/*
 * The input must be long enough for every WR and every sg entry.
 * NOTE(review): wqe_size, wr_count and sge_count are user-supplied and
 * these products are not visibly checked for overflow - confirm.
 */
1108 if (in_len < sizeof cmd + cmd.wqe_size * cmd.wr_count +
1109 cmd.sge_count * sizeof (struct ib_uverbs_sge))
/* Each user WR must be at least as large as the struct read from it. */
1112 if (cmd.wqe_size < sizeof (struct ib_uverbs_send_wr))
/* Bounce buffer reused for each user WR in turn. */
1115 user_wr = kmalloc(cmd.wqe_size, GFP_KERNEL);
1119 down(&ib_uverbs_idr_mutex);
1121 qp = idr_find(&ib_uverbs_qp_idr, cmd.qp_handle);
/* The handle must exist and belong to the calling file's context. */
1122 if (!qp || qp->uobject->context != file->ucontext)
1127 for (i = 0; i < cmd.wr_count; ++i) {
1128 if (copy_from_user(user_wr,
1129 buf + sizeof cmd + i * cmd.wqe_size,
/* sg_ind counts sg entries consumed so far; never exceed sge_count. */
1135 if (user_wr->num_sge + sg_ind > cmd.sge_count) {
/* One allocation: the WR struct, padding to ib_sge alignment, then the sg list. */
1140 next = kmalloc(ALIGN(sizeof *next, sizeof (struct ib_sge)) +
1141 user_wr->num_sge * sizeof (struct ib_sge),
1155 next->wr_id = user_wr->wr_id;
1156 next->num_sge = user_wr->num_sge;
1157 next->opcode = user_wr->opcode;
1158 next->send_flags = user_wr->send_flags;
1159 next->imm_data = user_wr->imm_data;
/* UD QPs carry an address handle plus remote QPN/Q_Key in each WR. */
1161 if (qp->qp_type == IB_QPT_UD) {
1162 next->wr.ud.ah = idr_find(&ib_uverbs_ah_idr,
1164 if (!next->wr.ud.ah) {
1168 next->wr.ud.remote_qpn = user_wr->wr.ud.remote_qpn;
1169 next->wr.ud.remote_qkey = user_wr->wr.ud.remote_qkey;
/* Other QP types: copy the opcode-specific RDMA or atomic fields. */
1171 switch (next->opcode) {
1172 case IB_WR_RDMA_WRITE:
1173 case IB_WR_RDMA_WRITE_WITH_IMM:
1174 case IB_WR_RDMA_READ:
1175 next->wr.rdma.remote_addr =
1176 user_wr->wr.rdma.remote_addr;
1177 next->wr.rdma.rkey =
1178 user_wr->wr.rdma.rkey;
1180 case IB_WR_ATOMIC_CMP_AND_SWP:
1181 case IB_WR_ATOMIC_FETCH_AND_ADD:
1182 next->wr.atomic.remote_addr =
1183 user_wr->wr.atomic.remote_addr;
1184 next->wr.atomic.compare_add =
1185 user_wr->wr.atomic.compare_add;
1186 next->wr.atomic.swap = user_wr->wr.atomic.swap;
1187 next->wr.atomic.rkey = user_wr->wr.atomic.rkey;
1194 if (next->num_sge) {
/* The sg list lives in the same allocation, right after the aligned WR. */
1195 next->sg_list = (void *) next +
1196 ALIGN(sizeof *next, sizeof (struct ib_sge));
1197 if (copy_from_user(next->sg_list,
1199 cmd.wr_count * cmd.wqe_size +
1200 sg_ind * sizeof (struct ib_sge),
1201 next->num_sge * sizeof (struct ib_sge))) {
1205 sg_ind += next->num_sge;
1207 next->sg_list = NULL;
1211 ret = qp->device->post_send(qp, wr, &bad_wr);
/* NOTE(review): this walk presumably locates bad_wr in the chain for the response - confirm. */
1213 for (next = wr; next; next = next->next) {
1219 if (copy_to_user((void __user *) (unsigned long) cmd.response,
1220 &resp, sizeof resp))
1224 up(&ib_uverbs_idr_mutex);
1234 return ret ? ret : in_len;
/*
 * ib_uverbs_unmarshall_recv - build a kernel receive WR chain from user data.
 *
 * buf holds wr_count work requests of wqe_size bytes each, followed by
 * the scatter/gather entries for all of them.  Each user WR is copied in
 * and converted into a kernel ib_recv_wr whose sg list is stored
 * directly after the struct in the same allocation.  Failures are
 * reported as ERR_PTR() values.
 */
1237 static struct ib_recv_wr *ib_uverbs_unmarshall_recv(const char __user *buf,
1243 struct ib_uverbs_recv_wr *user_wr;
1244 struct ib_recv_wr *wr = NULL, *last, *next;
/*
 * The input must be long enough for every WR and every sg entry.
 * NOTE(review): these products of caller-supplied counts are not
 * visibly checked for overflow - confirm.
 */
1249 if (in_len < wqe_size * wr_count +
1250 sge_count * sizeof (struct ib_uverbs_sge))
1251 return ERR_PTR(-EINVAL);
/* Each user WR must be at least as large as the struct read from it. */
1253 if (wqe_size < sizeof (struct ib_uverbs_recv_wr))
1254 return ERR_PTR(-EINVAL);
/* Bounce buffer reused for each user WR in turn. */
1256 user_wr = kmalloc(wqe_size, GFP_KERNEL);
1258 return ERR_PTR(-ENOMEM);
1262 for (i = 0; i < wr_count; ++i) {
1263 if (copy_from_user(user_wr, buf + i * wqe_size,
/* sg_ind counts sg entries consumed so far; never exceed sge_count. */
1269 if (user_wr->num_sge + sg_ind > sge_count) {
/* One allocation: the WR struct, padding to ib_sge alignment, then the sg list. */
1274 next = kmalloc(ALIGN(sizeof *next, sizeof (struct ib_sge)) +
1275 user_wr->num_sge * sizeof (struct ib_sge),
1289 next->wr_id = user_wr->wr_id;
1290 next->num_sge = user_wr->num_sge;
1292 if (next->num_sge) {
1293 next->sg_list = (void *) next +
1294 ALIGN(sizeof *next, sizeof (struct ib_sge));
/* The sg entries start after all wr_count work requests in buf. */
1295 if (copy_from_user(next->sg_list,
1296 buf + wr_count * wqe_size +
1297 sg_ind * sizeof (struct ib_sge),
1298 next->num_sge * sizeof (struct ib_sge))) {
1302 sg_ind += next->num_sge;
1304 next->sg_list = NULL;
1319 return ERR_PTR(ret);
/*
 * ib_uverbs_post_recv - post a chain of receive work requests to a QP.
 *
 * Reads the command from buf, converts the work requests that follow it
 * with ib_uverbs_unmarshall_recv(), looks up the QP named by
 * cmd.qp_handle, hands the chain to the device's post_recv method and
 * copies the response to cmd.response.  Returns ret when it is non-zero,
 * otherwise in_len.
 */
1322 ssize_t ib_uverbs_post_recv(struct ib_uverbs_file *file,
1323 const char __user *buf, int in_len,
1326 struct ib_uverbs_post_recv cmd;
1327 struct ib_uverbs_post_recv_resp resp;
1328 struct ib_recv_wr *wr, *next, *bad_wr;
1330 ssize_t ret = -EINVAL;
1332 if (copy_from_user(&cmd, buf, sizeof cmd))
/* The work requests and sg entries start right after the command struct. */
1335 wr = ib_uverbs_unmarshall_recv(buf + sizeof cmd,
1336 in_len - sizeof cmd, cmd.wr_count,
1337 cmd.sge_count, cmd.wqe_size);
1341 down(&ib_uverbs_idr_mutex);
1343 qp = idr_find(&ib_uverbs_qp_idr, cmd.qp_handle);
/* The handle must exist and belong to the calling file's context. */
1344 if (!qp || qp->uobject->context != file->ucontext)
1348 ret = qp->device->post_recv(qp, wr, &bad_wr);
/* NOTE(review): this walk presumably locates bad_wr in the chain for the response - confirm. */
1350 for (next = wr; next; next = next->next) {
1357 if (copy_to_user((void __user *) (unsigned long) cmd.response,
1358 &resp, sizeof resp))
1362 up(&ib_uverbs_idr_mutex);
1370 return ret ? ret : in_len;
/*
 * ib_uverbs_post_srq_recv - post receive work requests to a shared
 * receive queue.
 *
 * Reads the command from buf, converts the work requests that follow it
 * with ib_uverbs_unmarshall_recv(), looks up the SRQ named by
 * cmd.srq_handle, hands the chain to the device's post_srq_recv method
 * and copies the response to cmd.response.  Returns ret when it is
 * non-zero, otherwise in_len.
 */
1373 ssize_t ib_uverbs_post_srq_recv(struct ib_uverbs_file *file,
1374 const char __user *buf, int in_len,
1377 struct ib_uverbs_post_srq_recv cmd;
1378 struct ib_uverbs_post_srq_recv_resp resp;
1379 struct ib_recv_wr *wr, *next, *bad_wr;
1381 ssize_t ret = -EINVAL;
1383 if (copy_from_user(&cmd, buf, sizeof cmd))
/* The work requests and sg entries start right after the command struct. */
1386 wr = ib_uverbs_unmarshall_recv(buf + sizeof cmd,
1387 in_len - sizeof cmd, cmd.wr_count,
1388 cmd.sge_count, cmd.wqe_size);
1392 down(&ib_uverbs_idr_mutex);
1394 srq = idr_find(&ib_uverbs_srq_idr, cmd.srq_handle);
/* The handle must exist and belong to the calling file's context. */
1395 if (!srq || srq->uobject->context != file->ucontext)
1399 ret = srq->device->post_srq_recv(srq, wr, &bad_wr);
/* NOTE(review): this walk presumably locates bad_wr in the chain for the response - confirm. */
1401 for (next = wr; next; next = next->next) {
1408 if (copy_to_user((void __user *) (unsigned long) cmd.response,
1409 &resp, sizeof resp))
1413 up(&ib_uverbs_idr_mutex);
1421 return ret ? ret : in_len;
/*
 * ib_uverbs_create_ah - create an address handle.
 *
 * Reads the command from buf, looks up the PD named by cmd.pd_handle,
 * translates the user address attributes into an ib_ah_attr, creates
 * the AH with ib_create_ah(), stores it in ib_uverbs_ah_idr, returns the
 * id as resp.ah_handle and links the uobject on the context's ah_list.
 */
1424 ssize_t ib_uverbs_create_ah(struct ib_uverbs_file *file,
1425 const char __user *buf, int in_len,
1428 struct ib_uverbs_create_ah cmd;
1429 struct ib_uverbs_create_ah_resp resp;
1430 struct ib_uobject *uobj;
1433 struct ib_ah_attr attr;
/* The response must fit in the caller-supplied output space. */
1436 if (out_len < sizeof resp)
1439 if (copy_from_user(&cmd, buf, sizeof cmd))
1442 uobj = kmalloc(sizeof *uobj, GFP_KERNEL);
1446 down(&ib_uverbs_idr_mutex);
1448 pd = idr_find(&ib_uverbs_pd_idr, cmd.pd_handle);
/* The PD handle must exist and belong to the calling file's context. */
1449 if (!pd || pd->uobject->context != file->ucontext) {
1454 uobj->user_handle = cmd.user_handle;
1455 uobj->context = file->ucontext;
/* Translate the user-visible address attributes into the kernel form. */
1457 attr.dlid = cmd.attr.dlid;
1458 attr.sl = cmd.attr.sl;
1459 attr.src_path_bits = cmd.attr.src_path_bits;
1460 attr.static_rate = cmd.attr.static_rate;
1461 attr.port_num = cmd.attr.port_num;
1462 attr.grh.flow_label = cmd.attr.grh.flow_label;
1463 attr.grh.sgid_index = cmd.attr.grh.sgid_index;
1464 attr.grh.hop_limit = cmd.attr.grh.hop_limit;
1465 attr.grh.traffic_class = cmd.attr.grh.traffic_class;
1466 memcpy(attr.grh.dgid.raw, cmd.attr.grh.dgid, 16);
1468 ah = ib_create_ah(pd, &attr);
1477 if (!idr_pre_get(&ib_uverbs_ah_idr, GFP_KERNEL)) {
1482 ret = idr_get_new(&ib_uverbs_ah_idr, ah, &uobj->id);
1489 resp.ah_handle = uobj->id;
1491 if (copy_to_user((void __user *) (unsigned long) cmd.response,
1492 &resp, sizeof resp)) {
1498 list_add_tail(&uobj->list, &file->ucontext->ah_list);
1501 up(&ib_uverbs_idr_mutex);
/* NOTE(review): the lines below presumably belong to the error unwind path. */
1506 idr_remove(&ib_uverbs_ah_idr, uobj->id);
1512 up(&ib_uverbs_idr_mutex);
/*
 * ib_uverbs_destroy_ah - destroy an address handle named by handle.
 *
 * Looks up cmd.ah_handle in ib_uverbs_ah_idr under ib_uverbs_idr_mutex,
 * destroys the AH with ib_destroy_ah(), then drops the idr entry and
 * unlinks the tracking uobject.  Returns ret when it is non-zero,
 * otherwise in_len.
 */
1518 ssize_t ib_uverbs_destroy_ah(struct ib_uverbs_file *file,
1519 const char __user *buf, int in_len, int out_len)
1521 struct ib_uverbs_destroy_ah cmd;
1523 struct ib_uobject *uobj;
1526 if (copy_from_user(&cmd, buf, sizeof cmd))
1529 down(&ib_uverbs_idr_mutex);
1531 ah = idr_find(&ib_uverbs_ah_idr, cmd.ah_handle);
/* The handle must exist and belong to the calling file's context. */
1532 if (!ah || ah->uobject->context != file->ucontext)
1537 ret = ib_destroy_ah(ah);
1541 idr_remove(&ib_uverbs_ah_idr, cmd.ah_handle);
1544 list_del(&uobj->list);
1550 up(&ib_uverbs_idr_mutex);
1552 return ret ? ret : in_len;
/*
 * ib_uverbs_attach_mcast - attach a QP to a multicast group.
 *
 * Reads the command from buf and, if cmd.qp_handle names a QP owned by
 * the calling file's context, calls ib_attach_mcast() with the GID and
 * MLID from the command.  Returns ret when it is non-zero, otherwise
 * in_len.
 */
1555 ssize_t ib_uverbs_attach_mcast(struct ib_uverbs_file *file,
1556 const char __user *buf, int in_len,
1559 struct ib_uverbs_attach_mcast cmd;
1563 if (copy_from_user(&cmd, buf, sizeof cmd))
1566 down(&ib_uverbs_idr_mutex);
1568 qp = idr_find(&ib_uverbs_qp_idr, cmd.qp_handle);
/* ret is only assigned here when the handle is valid and owned by the caller. */
1569 if (qp && qp->uobject->context == file->ucontext)
1570 ret = ib_attach_mcast(qp, (union ib_gid *) cmd.gid, cmd.mlid);
1572 up(&ib_uverbs_idr_mutex);
1574 return ret ? ret : in_len;
/*
 * ib_uverbs_detach_mcast - detach a QP from a multicast group.
 *
 * Reads the command from buf and, if cmd.qp_handle names a QP owned by
 * the calling file's context, calls ib_detach_mcast() with the GID and
 * MLID from the command.  Returns ret when it is non-zero, otherwise
 * in_len.
 */
1577 ssize_t ib_uverbs_detach_mcast(struct ib_uverbs_file *file,
1578 const char __user *buf, int in_len,
1581 struct ib_uverbs_detach_mcast cmd;
1585 if (copy_from_user(&cmd, buf, sizeof cmd))
1588 down(&ib_uverbs_idr_mutex);
1590 qp = idr_find(&ib_uverbs_qp_idr, cmd.qp_handle);
/* ret is only assigned here when the handle is valid and owned by the caller. */
1591 if (qp && qp->uobject->context == file->ucontext)
1592 ret = ib_detach_mcast(qp, (union ib_gid *) cmd.gid, cmd.mlid);
1594 up(&ib_uverbs_idr_mutex);
1596 return ret ? ret : in_len;
/*
 * ib_uverbs_create_srq - create a shared receive queue.
 *
 * Reads the command from buf, looks up the PD named by cmd.pd_handle,
 * builds the init attributes from the command, has the device create
 * the SRQ, stores it in ib_uverbs_srq_idr, returns the id as
 * resp.srq_handle and links the object on the context's srq_list.
 */
1599 ssize_t ib_uverbs_create_srq(struct ib_uverbs_file *file,
1600 const char __user *buf, int in_len,
1603 struct ib_uverbs_create_srq cmd;
1604 struct ib_uverbs_create_srq_resp resp;
1605 struct ib_udata udata;
1606 struct ib_uevent_object *uobj;
1609 struct ib_srq_init_attr attr;
/* The response must fit in the caller-supplied output space. */
1612 if (out_len < sizeof resp)
1615 if (copy_from_user(&cmd, buf, sizeof cmd))
/* Driver-private input follows cmd; driver-private output follows resp. */
1618 INIT_UDATA(&udata, buf + sizeof cmd,
1619 (unsigned long) cmd.response + sizeof resp,
1620 in_len - sizeof cmd, out_len - sizeof resp);
1622 uobj = kmalloc(sizeof *uobj, GFP_KERNEL);
1626 down(&ib_uverbs_idr_mutex);
1628 pd = idr_find(&ib_uverbs_pd_idr, cmd.pd_handle);
/* The PD handle must exist and belong to the calling file's context. */
1630 if (!pd || pd->uobject->context != file->ucontext) {
1635 attr.event_handler = ib_uverbs_srq_event_handler;
1636 attr.srq_context = file;
1637 attr.attr.max_wr = cmd.max_wr;
1638 attr.attr.max_sge = cmd.max_sge;
1639 attr.attr.srq_limit = cmd.srq_limit;
1641 uobj->uobject.user_handle = cmd.user_handle;
1642 uobj->uobject.context = file->ucontext;
1643 uobj->events_reported = 0;
1644 INIT_LIST_HEAD(&uobj->event_list);
1646 srq = pd->device->create_srq(pd, &attr, &udata);
/* Fill in the generic SRQ fields from the init attributes. */
1652 srq->device = pd->device;
1654 srq->uobject = &uobj->uobject;
1655 srq->event_handler = attr.event_handler;
1656 srq->srq_context = attr.srq_context;
/* The new SRQ holds a use count on its PD. */
1657 atomic_inc(&pd->usecnt);
1658 atomic_set(&srq->usecnt, 0);
1660 memset(&resp, 0, sizeof resp);
1663 if (!idr_pre_get(&ib_uverbs_srq_idr, GFP_KERNEL)) {
1668 ret = idr_get_new(&ib_uverbs_srq_idr, srq, &uobj->uobject.id);
1675 resp.srq_handle = uobj->uobject.id;
1677 if (copy_to_user((void __user *) (unsigned long) cmd.response,
1678 &resp, sizeof resp)) {
1684 list_add_tail(&uobj->uobject.list, &file->ucontext->srq_list);
1687 up(&ib_uverbs_idr_mutex);
/* NOTE(review): the lines below presumably belong to the error unwind path. */
1692 idr_remove(&ib_uverbs_srq_idr, uobj->uobject.id);
1695 ib_destroy_srq(srq);
1698 up(&ib_uverbs_idr_mutex);
/*
 * ib_uverbs_modify_srq - modify a shared receive queue.
 *
 * Reads the command from buf, looks up the SRQ named by cmd.srq_handle
 * under ib_uverbs_idr_mutex and applies max_wr, max_sge and srq_limit
 * with ib_modify_srq(), using cmd.attr_mask as the attribute mask.
 * Returns ret when it is non-zero, otherwise in_len.
 */
1704 ssize_t ib_uverbs_modify_srq(struct ib_uverbs_file *file,
1705 const char __user *buf, int in_len,
1708 struct ib_uverbs_modify_srq cmd;
1710 struct ib_srq_attr attr;
1713 if (copy_from_user(&cmd, buf, sizeof cmd))
1716 down(&ib_uverbs_idr_mutex);
1718 srq = idr_find(&ib_uverbs_srq_idr, cmd.srq_handle);
/* The handle must exist and belong to the calling file's context. */
1719 if (!srq || srq->uobject->context != file->ucontext) {
1724 attr.max_wr = cmd.max_wr;
1725 attr.max_sge = cmd.max_sge;
1726 attr.srq_limit = cmd.srq_limit;
1728 ret = ib_modify_srq(srq, &attr, cmd.attr_mask);
1731 up(&ib_uverbs_idr_mutex);
1733 return ret ? ret : in_len;
/*
 * ib_uverbs_destroy_srq - destroy a shared receive queue named by handle.
 *
 * Looks up cmd.srq_handle under ib_uverbs_idr_mutex, destroys the SRQ
 * with ib_destroy_srq(), drops the idr entry and unlinks the tracking
 * object, removes async events still queued for this SRQ and reports
 * events_reported in the response.  Returns ret when it is non-zero,
 * otherwise in_len.
 */
1736 ssize_t ib_uverbs_destroy_srq(struct ib_uverbs_file *file,
1737 const char __user *buf, int in_len,
1740 struct ib_uverbs_destroy_srq cmd;
1741 struct ib_uverbs_destroy_srq_resp resp;
1743 struct ib_uevent_object *uobj;
1744 struct ib_uverbs_event *evt, *tmp;
1747 if (copy_from_user(&cmd, buf, sizeof cmd))
1750 down(&ib_uverbs_idr_mutex);
1752 memset(&resp, 0, sizeof resp);
1754 srq = idr_find(&ib_uverbs_srq_idr, cmd.srq_handle);
/* The handle must exist and belong to the calling file's context. */
1755 if (!srq || srq->uobject->context != file->ucontext)
1758 uobj = container_of(srq->uobject, struct ib_uevent_object, uobject);
1760 ret = ib_destroy_srq(srq);
1764 idr_remove(&ib_uverbs_srq_idr, cmd.srq_handle);
1767 list_del(&uobj->uobject.list);
/* Unqueue async events still pending for this SRQ. */
1770 spin_lock_irq(&file->async_file->lock);
1771 list_for_each_entry_safe(evt, tmp, &uobj->event_list, obj_list) {
1772 list_del(&evt->list);
1775 spin_unlock_irq(&file->async_file->lock);
1777 resp.events_reported = uobj->events_reported;
1781 if (copy_to_user((void __user *) (unsigned long) cmd.response,
1782 &resp, sizeof resp))
1786 up(&ib_uverbs_idr_mutex);
1788 return ret ? ret : in_len;