]> asedeno.scripts.mit.edu Git - linux.git/blob - drivers/infiniband/core/uverbs_cmd.c
7f10eade76531017ba709b29aaecd29e39dce282
[linux.git] / drivers / infiniband / core / uverbs_cmd.c
1 /*
2  * Copyright (c) 2005 Topspin Communications.  All rights reserved.
3  * Copyright (c) 2005, 2006, 2007 Cisco Systems.  All rights reserved.
4  * Copyright (c) 2005 PathScale, Inc.  All rights reserved.
5  * Copyright (c) 2006 Mellanox Technologies.  All rights reserved.
6  *
7  * This software is available to you under a choice of one of two
8  * licenses.  You may choose to be licensed under the terms of the GNU
9  * General Public License (GPL) Version 2, available from the file
10  * COPYING in the main directory of this source tree, or the
11  * OpenIB.org BSD license below:
12  *
13  *     Redistribution and use in source and binary forms, with or
14  *     without modification, are permitted provided that the following
15  *     conditions are met:
16  *
17  *      - Redistributions of source code must retain the above
18  *        copyright notice, this list of conditions and the following
19  *        disclaimer.
20  *
21  *      - Redistributions in binary form must reproduce the above
22  *        copyright notice, this list of conditions and the following
23  *        disclaimer in the documentation and/or other materials
24  *        provided with the distribution.
25  *
26  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
27  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
28  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
29  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
30  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
31  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
32  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
33  * SOFTWARE.
34  */
35
36 #include <linux/file.h>
37 #include <linux/fs.h>
38 #include <linux/slab.h>
39 #include <linux/sched.h>
40
41 #include <linux/uaccess.h>
42
43 #include <rdma/uverbs_types.h>
44 #include <rdma/uverbs_std_types.h>
45 #include "rdma_core.h"
46
47 #include "uverbs.h"
48 #include "core_priv.h"
49
50 /*
51  * Copy a response to userspace. If the provided 'resp' is larger than the
52  * user buffer it is silently truncated. If the user provided a larger buffer
53  * then the trailing portion is zero filled.
54  *
55  * These semantics are intended to support future extension of the output
56  * structures.
57  */
58 static int uverbs_response(struct uverbs_attr_bundle *attrs, const void *resp,
59                            size_t resp_len)
60 {
61         int ret;
62
63         if (copy_to_user(attrs->ucore.outbuf, resp,
64                          min(attrs->ucore.outlen, resp_len)))
65                 return -EFAULT;
66
67         if (resp_len < attrs->ucore.outlen) {
68                 /*
69                  * Zero fill any extra memory that user
70                  * space might have provided.
71                  */
72                 ret = clear_user(attrs->ucore.outbuf + resp_len,
73                                  attrs->ucore.outlen - resp_len);
74                 if (ret)
75                         return -EFAULT;
76         }
77
78         return 0;
79 }
80
81 /*
82  * Copy a request from userspace. If the provided 'req' is larger than the
83  * user buffer then the user buffer is zero extended into the 'req'. If 'req'
84  * is smaller than the user buffer then the uncopied bytes in the user buffer
85  * must be zero.
86  */
87 static int uverbs_request(struct uverbs_attr_bundle *attrs, void *req,
88                           size_t req_len)
89 {
90         if (copy_from_user(req, attrs->ucore.inbuf,
91                            min(attrs->ucore.inlen, req_len)))
92                 return -EFAULT;
93
94         if (attrs->ucore.inlen < req_len) {
95                 memset(req + attrs->ucore.inlen, 0,
96                        req_len - attrs->ucore.inlen);
97         } else if (attrs->ucore.inlen > req_len) {
98                 if (!ib_is_buffer_cleared(attrs->ucore.inbuf + req_len,
99                                           attrs->ucore.inlen - req_len))
100                         return -EOPNOTSUPP;
101         }
102         return 0;
103 }
104
105 /*
106  * Generate the value for the 'response_length' protocol used by write_ex.
107  * This is the number of bytes the kernel actually wrote. Userspace can use
108  * this to detect what structure members in the response the kernel
109  * understood.
110  */
111 static u32 uverbs_response_length(struct uverbs_attr_bundle *attrs,
112                                   size_t resp_len)
113 {
114         return min_t(size_t, attrs->ucore.outlen, resp_len);
115 }
116
117 /*
118  * The iterator version of the request interface is for handlers that need to
119  * step over a flex array at the end of a command header.
120  */
121 struct uverbs_req_iter {
122         const void __user *cur;
123         const void __user *end;
124 };
125
126 static int uverbs_request_start(struct uverbs_attr_bundle *attrs,
127                                 struct uverbs_req_iter *iter,
128                                 void *req,
129                                 size_t req_len)
130 {
131         if (attrs->ucore.inlen < req_len)
132                 return -ENOSPC;
133
134         if (copy_from_user(req, attrs->ucore.inbuf, req_len))
135                 return -EFAULT;
136
137         iter->cur = attrs->ucore.inbuf + req_len;
138         iter->end = attrs->ucore.inbuf + attrs->ucore.inlen;
139         return 0;
140 }
141
142 static int uverbs_request_next(struct uverbs_req_iter *iter, void *val,
143                                size_t len)
144 {
145         if (iter->cur + len > iter->end)
146                 return -ENOSPC;
147
148         if (copy_from_user(val, iter->cur, len))
149                 return -EFAULT;
150
151         iter->cur += len;
152         return 0;
153 }
154
155 static const void __user *uverbs_request_next_ptr(struct uverbs_req_iter *iter,
156                                                   size_t len)
157 {
158         const void __user *res = iter->cur;
159
160         if (iter->cur + len > iter->end)
161                 return ERR_PTR(-ENOSPC);
162         iter->cur += len;
163         return res;
164 }
165
166 static int uverbs_request_finish(struct uverbs_req_iter *iter)
167 {
168         if (!ib_is_buffer_cleared(iter->cur, iter->end - iter->cur))
169                 return -EOPNOTSUPP;
170         return 0;
171 }
172
173 static struct ib_uverbs_completion_event_file *
174 _ib_uverbs_lookup_comp_file(s32 fd, const struct uverbs_attr_bundle *attrs)
175 {
176         struct ib_uobject *uobj = ufd_get_read(UVERBS_OBJECT_COMP_CHANNEL,
177                                                fd, attrs);
178
179         if (IS_ERR(uobj))
180                 return (void *)uobj;
181
182         uverbs_uobject_get(uobj);
183         uobj_put_read(uobj);
184
185         return container_of(uobj, struct ib_uverbs_completion_event_file,
186                             uobj);
187 }
188 #define ib_uverbs_lookup_comp_file(_fd, _ufile)                                \
189         _ib_uverbs_lookup_comp_file((_fd)*typecheck(s32, _fd), _ufile)
190
191 static int ib_uverbs_get_context(struct uverbs_attr_bundle *attrs)
192 {
193         struct ib_uverbs_file *file = attrs->ufile;
194         struct ib_uverbs_get_context      cmd;
195         struct ib_uverbs_get_context_resp resp;
196         struct ib_ucontext               *ucontext;
197         struct file                      *filp;
198         struct ib_rdmacg_object          cg_obj;
199         struct ib_device *ib_dev;
200         int ret;
201
202         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
203         if (ret)
204                 return ret;
205
206         mutex_lock(&file->ucontext_lock);
207         ib_dev = srcu_dereference(file->device->ib_dev,
208                                   &file->device->disassociate_srcu);
209         if (!ib_dev) {
210                 ret = -EIO;
211                 goto err;
212         }
213
214         if (file->ucontext) {
215                 ret = -EINVAL;
216                 goto err;
217         }
218
219         ret = ib_rdmacg_try_charge(&cg_obj, ib_dev, RDMACG_RESOURCE_HCA_HANDLE);
220         if (ret)
221                 goto err;
222
223         ucontext = ib_dev->alloc_ucontext(ib_dev, &attrs->driver_udata);
224         if (IS_ERR(ucontext)) {
225                 ret = PTR_ERR(ucontext);
226                 goto err_alloc;
227         }
228
229         ucontext->device = ib_dev;
230         ucontext->cg_obj = cg_obj;
231         /* ufile is required when some objects are released */
232         ucontext->ufile = file;
233
234         ucontext->closing = false;
235         ucontext->cleanup_retryable = false;
236
237 #ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
238         mutex_init(&ucontext->per_mm_list_lock);
239         INIT_LIST_HEAD(&ucontext->per_mm_list);
240         if (!(ib_dev->attrs.device_cap_flags & IB_DEVICE_ON_DEMAND_PAGING))
241                 ucontext->invalidate_range = NULL;
242
243 #endif
244
245         resp.num_comp_vectors = file->device->num_comp_vectors;
246
247         ret = get_unused_fd_flags(O_CLOEXEC);
248         if (ret < 0)
249                 goto err_free;
250         resp.async_fd = ret;
251
252         filp = ib_uverbs_alloc_async_event_file(file, ib_dev);
253         if (IS_ERR(filp)) {
254                 ret = PTR_ERR(filp);
255                 goto err_fd;
256         }
257
258         ret = uverbs_response(attrs, &resp, sizeof(resp));
259         if (ret)
260                 goto err_file;
261
262         fd_install(resp.async_fd, filp);
263
264         ucontext->res.type = RDMA_RESTRACK_CTX;
265         rdma_restrack_add(&ucontext->res);
266
267         /*
268          * Make sure that ib_uverbs_get_ucontext() sees the pointer update
269          * only after all writes to setup the ucontext have completed
270          */
271         smp_store_release(&file->ucontext, ucontext);
272
273         mutex_unlock(&file->ucontext_lock);
274
275         return 0;
276
277 err_file:
278         ib_uverbs_free_async_event_file(file);
279         fput(filp);
280
281 err_fd:
282         put_unused_fd(resp.async_fd);
283
284 err_free:
285         ib_dev->dealloc_ucontext(ucontext);
286
287 err_alloc:
288         ib_rdmacg_uncharge(&cg_obj, ib_dev, RDMACG_RESOURCE_HCA_HANDLE);
289
290 err:
291         mutex_unlock(&file->ucontext_lock);
292         return ret;
293 }
294
295 static void copy_query_dev_fields(struct ib_ucontext *ucontext,
296                                   struct ib_uverbs_query_device_resp *resp,
297                                   struct ib_device_attr *attr)
298 {
299         struct ib_device *ib_dev = ucontext->device;
300
301         resp->fw_ver            = attr->fw_ver;
302         resp->node_guid         = ib_dev->node_guid;
303         resp->sys_image_guid    = attr->sys_image_guid;
304         resp->max_mr_size       = attr->max_mr_size;
305         resp->page_size_cap     = attr->page_size_cap;
306         resp->vendor_id         = attr->vendor_id;
307         resp->vendor_part_id    = attr->vendor_part_id;
308         resp->hw_ver            = attr->hw_ver;
309         resp->max_qp            = attr->max_qp;
310         resp->max_qp_wr         = attr->max_qp_wr;
311         resp->device_cap_flags  = lower_32_bits(attr->device_cap_flags);
312         resp->max_sge           = min(attr->max_send_sge, attr->max_recv_sge);
313         resp->max_sge_rd        = attr->max_sge_rd;
314         resp->max_cq            = attr->max_cq;
315         resp->max_cqe           = attr->max_cqe;
316         resp->max_mr            = attr->max_mr;
317         resp->max_pd            = attr->max_pd;
318         resp->max_qp_rd_atom    = attr->max_qp_rd_atom;
319         resp->max_ee_rd_atom    = attr->max_ee_rd_atom;
320         resp->max_res_rd_atom   = attr->max_res_rd_atom;
321         resp->max_qp_init_rd_atom       = attr->max_qp_init_rd_atom;
322         resp->max_ee_init_rd_atom       = attr->max_ee_init_rd_atom;
323         resp->atomic_cap                = attr->atomic_cap;
324         resp->max_ee                    = attr->max_ee;
325         resp->max_rdd                   = attr->max_rdd;
326         resp->max_mw                    = attr->max_mw;
327         resp->max_raw_ipv6_qp           = attr->max_raw_ipv6_qp;
328         resp->max_raw_ethy_qp           = attr->max_raw_ethy_qp;
329         resp->max_mcast_grp             = attr->max_mcast_grp;
330         resp->max_mcast_qp_attach       = attr->max_mcast_qp_attach;
331         resp->max_total_mcast_qp_attach = attr->max_total_mcast_qp_attach;
332         resp->max_ah                    = attr->max_ah;
333         resp->max_fmr                   = attr->max_fmr;
334         resp->max_map_per_fmr           = attr->max_map_per_fmr;
335         resp->max_srq                   = attr->max_srq;
336         resp->max_srq_wr                = attr->max_srq_wr;
337         resp->max_srq_sge               = attr->max_srq_sge;
338         resp->max_pkeys                 = attr->max_pkeys;
339         resp->local_ca_ack_delay        = attr->local_ca_ack_delay;
340         resp->phys_port_cnt             = ib_dev->phys_port_cnt;
341 }
342
343 static int ib_uverbs_query_device(struct uverbs_attr_bundle *attrs)
344 {
345         struct ib_uverbs_query_device      cmd;
346         struct ib_uverbs_query_device_resp resp;
347         struct ib_ucontext *ucontext;
348         int ret;
349
350         ucontext = ib_uverbs_get_ucontext(attrs);
351         if (IS_ERR(ucontext))
352                 return PTR_ERR(ucontext);
353
354         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
355         if (ret)
356                 return ret;
357
358         memset(&resp, 0, sizeof resp);
359         copy_query_dev_fields(ucontext, &resp, &ucontext->device->attrs);
360
361         return uverbs_response(attrs, &resp, sizeof(resp));
362 }
363
364 /*
365  * ib_uverbs_query_port_resp.port_cap_flags started out as just a copy of the
366  * PortInfo CapabilityMask, but was extended with unique bits.
367  */
368 static u32 make_port_cap_flags(const struct ib_port_attr *attr)
369 {
370         u32 res;
371
372         /* All IBA CapabilityMask bits are passed through here, except bit 26,
373          * which is overridden with IP_BASED_GIDS. This is due to a historical
374          * mistake in the implementation of IP_BASED_GIDS. Otherwise all other
375          * bits match the IBA definition across all kernel versions.
376          */
377         res = attr->port_cap_flags & ~(u32)IB_UVERBS_PCF_IP_BASED_GIDS;
378
379         if (attr->ip_gids)
380                 res |= IB_UVERBS_PCF_IP_BASED_GIDS;
381
382         return res;
383 }
384
385 static int ib_uverbs_query_port(struct uverbs_attr_bundle *attrs)
386 {
387         struct ib_uverbs_query_port      cmd;
388         struct ib_uverbs_query_port_resp resp;
389         struct ib_port_attr              attr;
390         int                              ret;
391         struct ib_ucontext *ucontext;
392         struct ib_device *ib_dev;
393
394         ucontext = ib_uverbs_get_ucontext(attrs);
395         if (IS_ERR(ucontext))
396                 return PTR_ERR(ucontext);
397         ib_dev = ucontext->device;
398
399         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
400         if (ret)
401                 return ret;
402
403         ret = ib_query_port(ib_dev, cmd.port_num, &attr);
404         if (ret)
405                 return ret;
406
407         memset(&resp, 0, sizeof resp);
408
409         resp.state           = attr.state;
410         resp.max_mtu         = attr.max_mtu;
411         resp.active_mtu      = attr.active_mtu;
412         resp.gid_tbl_len     = attr.gid_tbl_len;
413         resp.port_cap_flags  = make_port_cap_flags(&attr);
414         resp.max_msg_sz      = attr.max_msg_sz;
415         resp.bad_pkey_cntr   = attr.bad_pkey_cntr;
416         resp.qkey_viol_cntr  = attr.qkey_viol_cntr;
417         resp.pkey_tbl_len    = attr.pkey_tbl_len;
418
419         if (rdma_is_grh_required(ib_dev, cmd.port_num))
420                 resp.flags |= IB_UVERBS_QPF_GRH_REQUIRED;
421
422         if (rdma_cap_opa_ah(ib_dev, cmd.port_num)) {
423                 resp.lid     = OPA_TO_IB_UCAST_LID(attr.lid);
424                 resp.sm_lid  = OPA_TO_IB_UCAST_LID(attr.sm_lid);
425         } else {
426                 resp.lid     = ib_lid_cpu16(attr.lid);
427                 resp.sm_lid  = ib_lid_cpu16(attr.sm_lid);
428         }
429         resp.lmc             = attr.lmc;
430         resp.max_vl_num      = attr.max_vl_num;
431         resp.sm_sl           = attr.sm_sl;
432         resp.subnet_timeout  = attr.subnet_timeout;
433         resp.init_type_reply = attr.init_type_reply;
434         resp.active_width    = attr.active_width;
435         resp.active_speed    = attr.active_speed;
436         resp.phys_state      = attr.phys_state;
437         resp.link_layer      = rdma_port_get_link_layer(ib_dev,
438                                                         cmd.port_num);
439
440         return uverbs_response(attrs, &resp, sizeof(resp));
441 }
442
443 static int ib_uverbs_alloc_pd(struct uverbs_attr_bundle *attrs)
444 {
445         struct ib_uverbs_alloc_pd      cmd;
446         struct ib_uverbs_alloc_pd_resp resp;
447         struct ib_uobject             *uobj;
448         struct ib_pd                  *pd;
449         int                            ret;
450         struct ib_device *ib_dev;
451
452         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
453         if (ret)
454                 return ret;
455
456         uobj = uobj_alloc(UVERBS_OBJECT_PD, attrs, &ib_dev);
457         if (IS_ERR(uobj))
458                 return PTR_ERR(uobj);
459
460         pd = ib_dev->alloc_pd(ib_dev, uobj->context, &attrs->driver_udata);
461         if (IS_ERR(pd)) {
462                 ret = PTR_ERR(pd);
463                 goto err;
464         }
465
466         pd->device  = ib_dev;
467         pd->uobject = uobj;
468         pd->__internal_mr = NULL;
469         atomic_set(&pd->usecnt, 0);
470
471         uobj->object = pd;
472         memset(&resp, 0, sizeof resp);
473         resp.pd_handle = uobj->id;
474         pd->res.type = RDMA_RESTRACK_PD;
475         rdma_restrack_add(&pd->res);
476
477         ret = uverbs_response(attrs, &resp, sizeof(resp));
478         if (ret)
479                 goto err_copy;
480
481         return uobj_alloc_commit(uobj);
482
483 err_copy:
484         ib_dealloc_pd(pd);
485
486 err:
487         uobj_alloc_abort(uobj);
488         return ret;
489 }
490
491 static int ib_uverbs_dealloc_pd(struct uverbs_attr_bundle *attrs)
492 {
493         struct ib_uverbs_dealloc_pd cmd;
494         int ret;
495
496         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
497         if (ret)
498                 return ret;
499
500         return uobj_perform_destroy(UVERBS_OBJECT_PD, cmd.pd_handle, attrs);
501 }
502
503 struct xrcd_table_entry {
504         struct rb_node  node;
505         struct ib_xrcd *xrcd;
506         struct inode   *inode;
507 };
508
509 static int xrcd_table_insert(struct ib_uverbs_device *dev,
510                             struct inode *inode,
511                             struct ib_xrcd *xrcd)
512 {
513         struct xrcd_table_entry *entry, *scan;
514         struct rb_node **p = &dev->xrcd_tree.rb_node;
515         struct rb_node *parent = NULL;
516
517         entry = kmalloc(sizeof *entry, GFP_KERNEL);
518         if (!entry)
519                 return -ENOMEM;
520
521         entry->xrcd  = xrcd;
522         entry->inode = inode;
523
524         while (*p) {
525                 parent = *p;
526                 scan = rb_entry(parent, struct xrcd_table_entry, node);
527
528                 if (inode < scan->inode) {
529                         p = &(*p)->rb_left;
530                 } else if (inode > scan->inode) {
531                         p = &(*p)->rb_right;
532                 } else {
533                         kfree(entry);
534                         return -EEXIST;
535                 }
536         }
537
538         rb_link_node(&entry->node, parent, p);
539         rb_insert_color(&entry->node, &dev->xrcd_tree);
540         igrab(inode);
541         return 0;
542 }
543
544 static struct xrcd_table_entry *xrcd_table_search(struct ib_uverbs_device *dev,
545                                                   struct inode *inode)
546 {
547         struct xrcd_table_entry *entry;
548         struct rb_node *p = dev->xrcd_tree.rb_node;
549
550         while (p) {
551                 entry = rb_entry(p, struct xrcd_table_entry, node);
552
553                 if (inode < entry->inode)
554                         p = p->rb_left;
555                 else if (inode > entry->inode)
556                         p = p->rb_right;
557                 else
558                         return entry;
559         }
560
561         return NULL;
562 }
563
564 static struct ib_xrcd *find_xrcd(struct ib_uverbs_device *dev, struct inode *inode)
565 {
566         struct xrcd_table_entry *entry;
567
568         entry = xrcd_table_search(dev, inode);
569         if (!entry)
570                 return NULL;
571
572         return entry->xrcd;
573 }
574
575 static void xrcd_table_delete(struct ib_uverbs_device *dev,
576                               struct inode *inode)
577 {
578         struct xrcd_table_entry *entry;
579
580         entry = xrcd_table_search(dev, inode);
581         if (entry) {
582                 iput(inode);
583                 rb_erase(&entry->node, &dev->xrcd_tree);
584                 kfree(entry);
585         }
586 }
587
588 static int ib_uverbs_open_xrcd(struct uverbs_attr_bundle *attrs)
589 {
590         struct ib_uverbs_device *ibudev = attrs->ufile->device;
591         struct ib_uverbs_open_xrcd      cmd;
592         struct ib_uverbs_open_xrcd_resp resp;
593         struct ib_uxrcd_object         *obj;
594         struct ib_xrcd                 *xrcd = NULL;
595         struct fd                       f = {NULL, 0};
596         struct inode                   *inode = NULL;
597         int                             ret = 0;
598         int                             new_xrcd = 0;
599         struct ib_device *ib_dev;
600
601         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
602         if (ret)
603                 return ret;
604
605         mutex_lock(&ibudev->xrcd_tree_mutex);
606
607         if (cmd.fd != -1) {
608                 /* search for file descriptor */
609                 f = fdget(cmd.fd);
610                 if (!f.file) {
611                         ret = -EBADF;
612                         goto err_tree_mutex_unlock;
613                 }
614
615                 inode = file_inode(f.file);
616                 xrcd = find_xrcd(ibudev, inode);
617                 if (!xrcd && !(cmd.oflags & O_CREAT)) {
618                         /* no file descriptor. Need CREATE flag */
619                         ret = -EAGAIN;
620                         goto err_tree_mutex_unlock;
621                 }
622
623                 if (xrcd && cmd.oflags & O_EXCL) {
624                         ret = -EINVAL;
625                         goto err_tree_mutex_unlock;
626                 }
627         }
628
629         obj = (struct ib_uxrcd_object *)uobj_alloc(UVERBS_OBJECT_XRCD, attrs,
630                                                    &ib_dev);
631         if (IS_ERR(obj)) {
632                 ret = PTR_ERR(obj);
633                 goto err_tree_mutex_unlock;
634         }
635
636         if (!xrcd) {
637                 xrcd = ib_dev->alloc_xrcd(ib_dev, obj->uobject.context,
638                                           &attrs->driver_udata);
639                 if (IS_ERR(xrcd)) {
640                         ret = PTR_ERR(xrcd);
641                         goto err;
642                 }
643
644                 xrcd->inode   = inode;
645                 xrcd->device  = ib_dev;
646                 atomic_set(&xrcd->usecnt, 0);
647                 mutex_init(&xrcd->tgt_qp_mutex);
648                 INIT_LIST_HEAD(&xrcd->tgt_qp_list);
649                 new_xrcd = 1;
650         }
651
652         atomic_set(&obj->refcnt, 0);
653         obj->uobject.object = xrcd;
654         memset(&resp, 0, sizeof resp);
655         resp.xrcd_handle = obj->uobject.id;
656
657         if (inode) {
658                 if (new_xrcd) {
659                         /* create new inode/xrcd table entry */
660                         ret = xrcd_table_insert(ibudev, inode, xrcd);
661                         if (ret)
662                                 goto err_dealloc_xrcd;
663                 }
664                 atomic_inc(&xrcd->usecnt);
665         }
666
667         ret = uverbs_response(attrs, &resp, sizeof(resp));
668         if (ret)
669                 goto err_copy;
670
671         if (f.file)
672                 fdput(f);
673
674         mutex_unlock(&ibudev->xrcd_tree_mutex);
675
676         return uobj_alloc_commit(&obj->uobject);
677
678 err_copy:
679         if (inode) {
680                 if (new_xrcd)
681                         xrcd_table_delete(ibudev, inode);
682                 atomic_dec(&xrcd->usecnt);
683         }
684
685 err_dealloc_xrcd:
686         ib_dealloc_xrcd(xrcd);
687
688 err:
689         uobj_alloc_abort(&obj->uobject);
690
691 err_tree_mutex_unlock:
692         if (f.file)
693                 fdput(f);
694
695         mutex_unlock(&ibudev->xrcd_tree_mutex);
696
697         return ret;
698 }
699
700 static int ib_uverbs_close_xrcd(struct uverbs_attr_bundle *attrs)
701 {
702         struct ib_uverbs_close_xrcd cmd;
703         int ret;
704
705         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
706         if (ret)
707                 return ret;
708
709         return uobj_perform_destroy(UVERBS_OBJECT_XRCD, cmd.xrcd_handle, attrs);
710 }
711
712 int ib_uverbs_dealloc_xrcd(struct ib_uobject *uobject,
713                            struct ib_xrcd *xrcd,
714                            enum rdma_remove_reason why)
715 {
716         struct inode *inode;
717         int ret;
718         struct ib_uverbs_device *dev = uobject->context->ufile->device;
719
720         inode = xrcd->inode;
721         if (inode && !atomic_dec_and_test(&xrcd->usecnt))
722                 return 0;
723
724         ret = ib_dealloc_xrcd(xrcd);
725
726         if (ib_is_destroy_retryable(ret, why, uobject)) {
727                 atomic_inc(&xrcd->usecnt);
728                 return ret;
729         }
730
731         if (inode)
732                 xrcd_table_delete(dev, inode);
733
734         return ret;
735 }
736
737 static int ib_uverbs_reg_mr(struct uverbs_attr_bundle *attrs)
738 {
739         struct ib_uverbs_reg_mr      cmd;
740         struct ib_uverbs_reg_mr_resp resp;
741         struct ib_uobject           *uobj;
742         struct ib_pd                *pd;
743         struct ib_mr                *mr;
744         int                          ret;
745         struct ib_device *ib_dev;
746
747         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
748         if (ret)
749                 return ret;
750
751         if ((cmd.start & ~PAGE_MASK) != (cmd.hca_va & ~PAGE_MASK))
752                 return -EINVAL;
753
754         ret = ib_check_mr_access(cmd.access_flags);
755         if (ret)
756                 return ret;
757
758         uobj = uobj_alloc(UVERBS_OBJECT_MR, attrs, &ib_dev);
759         if (IS_ERR(uobj))
760                 return PTR_ERR(uobj);
761
762         pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs);
763         if (!pd) {
764                 ret = -EINVAL;
765                 goto err_free;
766         }
767
768         if (cmd.access_flags & IB_ACCESS_ON_DEMAND) {
769                 if (!(pd->device->attrs.device_cap_flags &
770                       IB_DEVICE_ON_DEMAND_PAGING)) {
771                         pr_debug("ODP support not available\n");
772                         ret = -EINVAL;
773                         goto err_put;
774                 }
775         }
776
777         mr = pd->device->reg_user_mr(pd, cmd.start, cmd.length, cmd.hca_va,
778                                      cmd.access_flags, &attrs->driver_udata);
779         if (IS_ERR(mr)) {
780                 ret = PTR_ERR(mr);
781                 goto err_put;
782         }
783
784         mr->device  = pd->device;
785         mr->pd      = pd;
786         mr->dm      = NULL;
787         mr->uobject = uobj;
788         atomic_inc(&pd->usecnt);
789         mr->res.type = RDMA_RESTRACK_MR;
790         rdma_restrack_add(&mr->res);
791
792         uobj->object = mr;
793
794         memset(&resp, 0, sizeof resp);
795         resp.lkey      = mr->lkey;
796         resp.rkey      = mr->rkey;
797         resp.mr_handle = uobj->id;
798
799         ret = uverbs_response(attrs, &resp, sizeof(resp));
800         if (ret)
801                 goto err_copy;
802
803         uobj_put_obj_read(pd);
804
805         return uobj_alloc_commit(uobj);
806
807 err_copy:
808         ib_dereg_mr(mr);
809
810 err_put:
811         uobj_put_obj_read(pd);
812
813 err_free:
814         uobj_alloc_abort(uobj);
815         return ret;
816 }
817
818 static int ib_uverbs_rereg_mr(struct uverbs_attr_bundle *attrs)
819 {
820         struct ib_uverbs_rereg_mr      cmd;
821         struct ib_uverbs_rereg_mr_resp resp;
822         struct ib_pd                *pd = NULL;
823         struct ib_mr                *mr;
824         struct ib_pd                *old_pd;
825         int                          ret;
826         struct ib_uobject           *uobj;
827
828         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
829         if (ret)
830                 return ret;
831
832         if (cmd.flags & ~IB_MR_REREG_SUPPORTED || !cmd.flags)
833                 return -EINVAL;
834
835         if ((cmd.flags & IB_MR_REREG_TRANS) &&
836             (!cmd.start || !cmd.hca_va || 0 >= cmd.length ||
837              (cmd.start & ~PAGE_MASK) != (cmd.hca_va & ~PAGE_MASK)))
838                         return -EINVAL;
839
840         uobj = uobj_get_write(UVERBS_OBJECT_MR, cmd.mr_handle, attrs);
841         if (IS_ERR(uobj))
842                 return PTR_ERR(uobj);
843
844         mr = uobj->object;
845
846         if (mr->dm) {
847                 ret = -EINVAL;
848                 goto put_uobjs;
849         }
850
851         if (cmd.flags & IB_MR_REREG_ACCESS) {
852                 ret = ib_check_mr_access(cmd.access_flags);
853                 if (ret)
854                         goto put_uobjs;
855         }
856
857         if (cmd.flags & IB_MR_REREG_PD) {
858                 pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle,
859                                        attrs);
860                 if (!pd) {
861                         ret = -EINVAL;
862                         goto put_uobjs;
863                 }
864         }
865
866         old_pd = mr->pd;
867         ret = mr->device->rereg_user_mr(mr, cmd.flags, cmd.start, cmd.length,
868                                         cmd.hca_va, cmd.access_flags, pd,
869                                         &attrs->driver_udata);
870         if (!ret) {
871                 if (cmd.flags & IB_MR_REREG_PD) {
872                         atomic_inc(&pd->usecnt);
873                         mr->pd = pd;
874                         atomic_dec(&old_pd->usecnt);
875                 }
876         } else {
877                 goto put_uobj_pd;
878         }
879
880         memset(&resp, 0, sizeof(resp));
881         resp.lkey      = mr->lkey;
882         resp.rkey      = mr->rkey;
883
884         ret = uverbs_response(attrs, &resp, sizeof(resp));
885
886 put_uobj_pd:
887         if (cmd.flags & IB_MR_REREG_PD)
888                 uobj_put_obj_read(pd);
889
890 put_uobjs:
891         uobj_put_write(uobj);
892
893         return ret;
894 }
895
896 static int ib_uverbs_dereg_mr(struct uverbs_attr_bundle *attrs)
897 {
898         struct ib_uverbs_dereg_mr cmd;
899         int ret;
900
901         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
902         if (ret)
903                 return ret;
904
905         return uobj_perform_destroy(UVERBS_OBJECT_MR, cmd.mr_handle, attrs);
906 }
907
908 static int ib_uverbs_alloc_mw(struct uverbs_attr_bundle *attrs)
909 {
910         struct ib_uverbs_alloc_mw      cmd;
911         struct ib_uverbs_alloc_mw_resp resp;
912         struct ib_uobject             *uobj;
913         struct ib_pd                  *pd;
914         struct ib_mw                  *mw;
915         int                            ret;
916         struct ib_device *ib_dev;
917
918         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
919         if (ret)
920                 return ret;
921
922         uobj = uobj_alloc(UVERBS_OBJECT_MW, attrs, &ib_dev);
923         if (IS_ERR(uobj))
924                 return PTR_ERR(uobj);
925
926         pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs);
927         if (!pd) {
928                 ret = -EINVAL;
929                 goto err_free;
930         }
931
932         mw = pd->device->alloc_mw(pd, cmd.mw_type, &attrs->driver_udata);
933         if (IS_ERR(mw)) {
934                 ret = PTR_ERR(mw);
935                 goto err_put;
936         }
937
938         mw->device  = pd->device;
939         mw->pd      = pd;
940         mw->uobject = uobj;
941         atomic_inc(&pd->usecnt);
942
943         uobj->object = mw;
944
945         memset(&resp, 0, sizeof(resp));
946         resp.rkey      = mw->rkey;
947         resp.mw_handle = uobj->id;
948
949         ret = uverbs_response(attrs, &resp, sizeof(resp));
950         if (ret)
951                 goto err_copy;
952
953         uobj_put_obj_read(pd);
954         return uobj_alloc_commit(uobj);
955
956 err_copy:
957         uverbs_dealloc_mw(mw);
958 err_put:
959         uobj_put_obj_read(pd);
960 err_free:
961         uobj_alloc_abort(uobj);
962         return ret;
963 }
964
965 static int ib_uverbs_dealloc_mw(struct uverbs_attr_bundle *attrs)
966 {
967         struct ib_uverbs_dealloc_mw cmd;
968         int ret;
969
970         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
971         if (ret)
972                 return ret;
973
974         return uobj_perform_destroy(UVERBS_OBJECT_MW, cmd.mw_handle, attrs);
975 }
976
977 static int ib_uverbs_create_comp_channel(struct uverbs_attr_bundle *attrs)
978 {
979         struct ib_uverbs_create_comp_channel       cmd;
980         struct ib_uverbs_create_comp_channel_resp  resp;
981         struct ib_uobject                         *uobj;
982         struct ib_uverbs_completion_event_file    *ev_file;
983         struct ib_device *ib_dev;
984         int ret;
985
986         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
987         if (ret)
988                 return ret;
989
990         uobj = uobj_alloc(UVERBS_OBJECT_COMP_CHANNEL, attrs, &ib_dev);
991         if (IS_ERR(uobj))
992                 return PTR_ERR(uobj);
993
994         resp.fd = uobj->id;
995
996         ev_file = container_of(uobj, struct ib_uverbs_completion_event_file,
997                                uobj);
998         ib_uverbs_init_event_queue(&ev_file->ev_queue);
999
1000         ret = uverbs_response(attrs, &resp, sizeof(resp));
1001         if (ret) {
1002                 uobj_alloc_abort(uobj);
1003                 return ret;
1004         }
1005
1006         return uobj_alloc_commit(uobj);
1007 }
1008
1009 static struct ib_ucq_object *create_cq(struct uverbs_attr_bundle *attrs,
1010                                        struct ib_uverbs_ex_create_cq *cmd)
1011 {
1012         struct ib_ucq_object           *obj;
1013         struct ib_uverbs_completion_event_file    *ev_file = NULL;
1014         struct ib_cq                   *cq;
1015         int                             ret;
1016         struct ib_uverbs_ex_create_cq_resp resp;
1017         struct ib_cq_init_attr attr = {};
1018         struct ib_device *ib_dev;
1019
1020         if (cmd->comp_vector >= attrs->ufile->device->num_comp_vectors)
1021                 return ERR_PTR(-EINVAL);
1022
1023         obj = (struct ib_ucq_object *)uobj_alloc(UVERBS_OBJECT_CQ, attrs,
1024                                                  &ib_dev);
1025         if (IS_ERR(obj))
1026                 return obj;
1027
1028         if (cmd->comp_channel >= 0) {
1029                 ev_file = ib_uverbs_lookup_comp_file(cmd->comp_channel, attrs);
1030                 if (IS_ERR(ev_file)) {
1031                         ret = PTR_ERR(ev_file);
1032                         goto err;
1033                 }
1034         }
1035
1036         obj->uobject.user_handle = cmd->user_handle;
1037         obj->comp_events_reported  = 0;
1038         obj->async_events_reported = 0;
1039         INIT_LIST_HEAD(&obj->comp_list);
1040         INIT_LIST_HEAD(&obj->async_list);
1041
1042         attr.cqe = cmd->cqe;
1043         attr.comp_vector = cmd->comp_vector;
1044         attr.flags = cmd->flags;
1045
1046         cq = ib_dev->create_cq(ib_dev, &attr, obj->uobject.context,
1047                                &attrs->driver_udata);
1048         if (IS_ERR(cq)) {
1049                 ret = PTR_ERR(cq);
1050                 goto err_file;
1051         }
1052
1053         cq->device        = ib_dev;
1054         cq->uobject       = &obj->uobject;
1055         cq->comp_handler  = ib_uverbs_comp_handler;
1056         cq->event_handler = ib_uverbs_cq_event_handler;
1057         cq->cq_context    = ev_file ? &ev_file->ev_queue : NULL;
1058         atomic_set(&cq->usecnt, 0);
1059
1060         obj->uobject.object = cq;
1061         memset(&resp, 0, sizeof resp);
1062         resp.base.cq_handle = obj->uobject.id;
1063         resp.base.cqe       = cq->cqe;
1064         resp.response_length = uverbs_response_length(attrs, sizeof(resp));
1065
1066         cq->res.type = RDMA_RESTRACK_CQ;
1067         rdma_restrack_add(&cq->res);
1068
1069         ret = uverbs_response(attrs, &resp, sizeof(resp));
1070         if (ret)
1071                 goto err_cb;
1072
1073         ret = uobj_alloc_commit(&obj->uobject);
1074         if (ret)
1075                 return ERR_PTR(ret);
1076         return obj;
1077
1078 err_cb:
1079         ib_destroy_cq(cq);
1080
1081 err_file:
1082         if (ev_file)
1083                 ib_uverbs_release_ucq(attrs->ufile, ev_file, obj);
1084
1085 err:
1086         uobj_alloc_abort(&obj->uobject);
1087
1088         return ERR_PTR(ret);
1089 }
1090
1091 static int ib_uverbs_create_cq(struct uverbs_attr_bundle *attrs)
1092 {
1093         struct ib_uverbs_create_cq      cmd;
1094         struct ib_uverbs_ex_create_cq   cmd_ex;
1095         struct ib_ucq_object           *obj;
1096         int ret;
1097
1098         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1099         if (ret)
1100                 return ret;
1101
1102         memset(&cmd_ex, 0, sizeof(cmd_ex));
1103         cmd_ex.user_handle = cmd.user_handle;
1104         cmd_ex.cqe = cmd.cqe;
1105         cmd_ex.comp_vector = cmd.comp_vector;
1106         cmd_ex.comp_channel = cmd.comp_channel;
1107
1108         obj = create_cq(attrs, &cmd_ex);
1109         return PTR_ERR_OR_ZERO(obj);
1110 }
1111
1112 static int ib_uverbs_ex_create_cq(struct uverbs_attr_bundle *attrs)
1113 {
1114         struct ib_uverbs_ex_create_cq  cmd;
1115         struct ib_ucq_object           *obj;
1116         int ret;
1117
1118         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1119         if (ret)
1120                 return ret;
1121
1122         if (cmd.comp_mask)
1123                 return -EINVAL;
1124
1125         if (cmd.reserved)
1126                 return -EINVAL;
1127
1128         obj = create_cq(attrs, &cmd);
1129         return PTR_ERR_OR_ZERO(obj);
1130 }
1131
1132 static int ib_uverbs_resize_cq(struct uverbs_attr_bundle *attrs)
1133 {
1134         struct ib_uverbs_resize_cq      cmd;
1135         struct ib_uverbs_resize_cq_resp resp = {};
1136         struct ib_cq                    *cq;
1137         int                             ret = -EINVAL;
1138
1139         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1140         if (ret)
1141                 return ret;
1142
1143         cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs);
1144         if (!cq)
1145                 return -EINVAL;
1146
1147         ret = cq->device->resize_cq(cq, cmd.cqe, &attrs->driver_udata);
1148         if (ret)
1149                 goto out;
1150
1151         resp.cqe = cq->cqe;
1152
1153         ret = uverbs_response(attrs, &resp, sizeof(resp));
1154 out:
1155         uobj_put_obj_read(cq);
1156
1157         return ret;
1158 }
1159
1160 static int copy_wc_to_user(struct ib_device *ib_dev, void __user *dest,
1161                            struct ib_wc *wc)
1162 {
1163         struct ib_uverbs_wc tmp;
1164
1165         tmp.wr_id               = wc->wr_id;
1166         tmp.status              = wc->status;
1167         tmp.opcode              = wc->opcode;
1168         tmp.vendor_err          = wc->vendor_err;
1169         tmp.byte_len            = wc->byte_len;
1170         tmp.ex.imm_data         = wc->ex.imm_data;
1171         tmp.qp_num              = wc->qp->qp_num;
1172         tmp.src_qp              = wc->src_qp;
1173         tmp.wc_flags            = wc->wc_flags;
1174         tmp.pkey_index          = wc->pkey_index;
1175         if (rdma_cap_opa_ah(ib_dev, wc->port_num))
1176                 tmp.slid        = OPA_TO_IB_UCAST_LID(wc->slid);
1177         else
1178                 tmp.slid        = ib_lid_cpu16(wc->slid);
1179         tmp.sl                  = wc->sl;
1180         tmp.dlid_path_bits      = wc->dlid_path_bits;
1181         tmp.port_num            = wc->port_num;
1182         tmp.reserved            = 0;
1183
1184         if (copy_to_user(dest, &tmp, sizeof tmp))
1185                 return -EFAULT;
1186
1187         return 0;
1188 }
1189
1190 static int ib_uverbs_poll_cq(struct uverbs_attr_bundle *attrs)
1191 {
1192         struct ib_uverbs_poll_cq       cmd;
1193         struct ib_uverbs_poll_cq_resp  resp;
1194         u8 __user                     *header_ptr;
1195         u8 __user                     *data_ptr;
1196         struct ib_cq                  *cq;
1197         struct ib_wc                   wc;
1198         int                            ret;
1199
1200         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1201         if (ret)
1202                 return ret;
1203
1204         cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs);
1205         if (!cq)
1206                 return -EINVAL;
1207
1208         /* we copy a struct ib_uverbs_poll_cq_resp to user space */
1209         header_ptr = attrs->ucore.outbuf;
1210         data_ptr = header_ptr + sizeof resp;
1211
1212         memset(&resp, 0, sizeof resp);
1213         while (resp.count < cmd.ne) {
1214                 ret = ib_poll_cq(cq, 1, &wc);
1215                 if (ret < 0)
1216                         goto out_put;
1217                 if (!ret)
1218                         break;
1219
1220                 ret = copy_wc_to_user(cq->device, data_ptr, &wc);
1221                 if (ret)
1222                         goto out_put;
1223
1224                 data_ptr += sizeof(struct ib_uverbs_wc);
1225                 ++resp.count;
1226         }
1227
1228         if (copy_to_user(header_ptr, &resp, sizeof resp)) {
1229                 ret = -EFAULT;
1230                 goto out_put;
1231         }
1232
1233         ret = 0;
1234
1235 out_put:
1236         uobj_put_obj_read(cq);
1237         return ret;
1238 }
1239
1240 static int ib_uverbs_req_notify_cq(struct uverbs_attr_bundle *attrs)
1241 {
1242         struct ib_uverbs_req_notify_cq cmd;
1243         struct ib_cq                  *cq;
1244         int ret;
1245
1246         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1247         if (ret)
1248                 return ret;
1249
1250         cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs);
1251         if (!cq)
1252                 return -EINVAL;
1253
1254         ib_req_notify_cq(cq, cmd.solicited_only ?
1255                          IB_CQ_SOLICITED : IB_CQ_NEXT_COMP);
1256
1257         uobj_put_obj_read(cq);
1258
1259         return 0;
1260 }
1261
1262 static int ib_uverbs_destroy_cq(struct uverbs_attr_bundle *attrs)
1263 {
1264         struct ib_uverbs_destroy_cq      cmd;
1265         struct ib_uverbs_destroy_cq_resp resp;
1266         struct ib_uobject               *uobj;
1267         struct ib_ucq_object            *obj;
1268         int ret;
1269
1270         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1271         if (ret)
1272                 return ret;
1273
1274         uobj = uobj_get_destroy(UVERBS_OBJECT_CQ, cmd.cq_handle, attrs);
1275         if (IS_ERR(uobj))
1276                 return PTR_ERR(uobj);
1277
1278         obj = container_of(uobj, struct ib_ucq_object, uobject);
1279         memset(&resp, 0, sizeof(resp));
1280         resp.comp_events_reported  = obj->comp_events_reported;
1281         resp.async_events_reported = obj->async_events_reported;
1282
1283         uobj_put_destroy(uobj);
1284
1285         return uverbs_response(attrs, &resp, sizeof(resp));
1286 }
1287
1288 static int create_qp(struct uverbs_attr_bundle *attrs,
1289                      struct ib_uverbs_ex_create_qp *cmd)
1290 {
1291         struct ib_uqp_object            *obj;
1292         struct ib_device                *device;
1293         struct ib_pd                    *pd = NULL;
1294         struct ib_xrcd                  *xrcd = NULL;
1295         struct ib_uobject               *xrcd_uobj = ERR_PTR(-ENOENT);
1296         struct ib_cq                    *scq = NULL, *rcq = NULL;
1297         struct ib_srq                   *srq = NULL;
1298         struct ib_qp                    *qp;
1299         struct ib_qp_init_attr          attr = {};
1300         struct ib_uverbs_ex_create_qp_resp resp;
1301         int                             ret;
1302         struct ib_rwq_ind_table *ind_tbl = NULL;
1303         bool has_sq = true;
1304         struct ib_device *ib_dev;
1305
1306         if (cmd->qp_type == IB_QPT_RAW_PACKET && !capable(CAP_NET_RAW))
1307                 return -EPERM;
1308
1309         obj = (struct ib_uqp_object *)uobj_alloc(UVERBS_OBJECT_QP, attrs,
1310                                                  &ib_dev);
1311         if (IS_ERR(obj))
1312                 return PTR_ERR(obj);
1313         obj->uxrcd = NULL;
1314         obj->uevent.uobject.user_handle = cmd->user_handle;
1315         mutex_init(&obj->mcast_lock);
1316
1317         if (cmd->comp_mask & IB_UVERBS_CREATE_QP_MASK_IND_TABLE) {
1318                 ind_tbl = uobj_get_obj_read(rwq_ind_table,
1319                                             UVERBS_OBJECT_RWQ_IND_TBL,
1320                                             cmd->rwq_ind_tbl_handle, attrs);
1321                 if (!ind_tbl) {
1322                         ret = -EINVAL;
1323                         goto err_put;
1324                 }
1325
1326                 attr.rwq_ind_tbl = ind_tbl;
1327         }
1328
1329         if (ind_tbl && (cmd->max_recv_wr || cmd->max_recv_sge || cmd->is_srq)) {
1330                 ret = -EINVAL;
1331                 goto err_put;
1332         }
1333
1334         if (ind_tbl && !cmd->max_send_wr)
1335                 has_sq = false;
1336
1337         if (cmd->qp_type == IB_QPT_XRC_TGT) {
1338                 xrcd_uobj = uobj_get_read(UVERBS_OBJECT_XRCD, cmd->pd_handle,
1339                                           attrs);
1340
1341                 if (IS_ERR(xrcd_uobj)) {
1342                         ret = -EINVAL;
1343                         goto err_put;
1344                 }
1345
1346                 xrcd = (struct ib_xrcd *)xrcd_uobj->object;
1347                 if (!xrcd) {
1348                         ret = -EINVAL;
1349                         goto err_put;
1350                 }
1351                 device = xrcd->device;
1352         } else {
1353                 if (cmd->qp_type == IB_QPT_XRC_INI) {
1354                         cmd->max_recv_wr = 0;
1355                         cmd->max_recv_sge = 0;
1356                 } else {
1357                         if (cmd->is_srq) {
1358                                 srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ,
1359                                                         cmd->srq_handle, attrs);
1360                                 if (!srq || srq->srq_type == IB_SRQT_XRC) {
1361                                         ret = -EINVAL;
1362                                         goto err_put;
1363                                 }
1364                         }
1365
1366                         if (!ind_tbl) {
1367                                 if (cmd->recv_cq_handle != cmd->send_cq_handle) {
1368                                         rcq = uobj_get_obj_read(
1369                                                 cq, UVERBS_OBJECT_CQ,
1370                                                 cmd->recv_cq_handle, attrs);
1371                                         if (!rcq) {
1372                                                 ret = -EINVAL;
1373                                                 goto err_put;
1374                                         }
1375                                 }
1376                         }
1377                 }
1378
1379                 if (has_sq)
1380                         scq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ,
1381                                                 cmd->send_cq_handle, attrs);
1382                 if (!ind_tbl)
1383                         rcq = rcq ?: scq;
1384                 pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd->pd_handle,
1385                                        attrs);
1386                 if (!pd || (!scq && has_sq)) {
1387                         ret = -EINVAL;
1388                         goto err_put;
1389                 }
1390
1391                 device = pd->device;
1392         }
1393
1394         attr.event_handler = ib_uverbs_qp_event_handler;
1395         attr.qp_context    = attrs->ufile;
1396         attr.send_cq       = scq;
1397         attr.recv_cq       = rcq;
1398         attr.srq           = srq;
1399         attr.xrcd          = xrcd;
1400         attr.sq_sig_type   = cmd->sq_sig_all ? IB_SIGNAL_ALL_WR :
1401                                               IB_SIGNAL_REQ_WR;
1402         attr.qp_type       = cmd->qp_type;
1403         attr.create_flags  = 0;
1404
1405         attr.cap.max_send_wr     = cmd->max_send_wr;
1406         attr.cap.max_recv_wr     = cmd->max_recv_wr;
1407         attr.cap.max_send_sge    = cmd->max_send_sge;
1408         attr.cap.max_recv_sge    = cmd->max_recv_sge;
1409         attr.cap.max_inline_data = cmd->max_inline_data;
1410
1411         obj->uevent.events_reported     = 0;
1412         INIT_LIST_HEAD(&obj->uevent.event_list);
1413         INIT_LIST_HEAD(&obj->mcast_list);
1414
1415         attr.create_flags = cmd->create_flags;
1416         if (attr.create_flags & ~(IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK |
1417                                 IB_QP_CREATE_CROSS_CHANNEL |
1418                                 IB_QP_CREATE_MANAGED_SEND |
1419                                 IB_QP_CREATE_MANAGED_RECV |
1420                                 IB_QP_CREATE_SCATTER_FCS |
1421                                 IB_QP_CREATE_CVLAN_STRIPPING |
1422                                 IB_QP_CREATE_SOURCE_QPN |
1423                                 IB_QP_CREATE_PCI_WRITE_END_PADDING)) {
1424                 ret = -EINVAL;
1425                 goto err_put;
1426         }
1427
1428         if (attr.create_flags & IB_QP_CREATE_SOURCE_QPN) {
1429                 if (!capable(CAP_NET_RAW)) {
1430                         ret = -EPERM;
1431                         goto err_put;
1432                 }
1433
1434                 attr.source_qpn = cmd->source_qpn;
1435         }
1436
1437         if (cmd->qp_type == IB_QPT_XRC_TGT)
1438                 qp = ib_create_qp(pd, &attr);
1439         else
1440                 qp = _ib_create_qp(device, pd, &attr, &attrs->driver_udata,
1441                                    &obj->uevent.uobject);
1442
1443         if (IS_ERR(qp)) {
1444                 ret = PTR_ERR(qp);
1445                 goto err_put;
1446         }
1447
1448         if (cmd->qp_type != IB_QPT_XRC_TGT) {
1449                 ret = ib_create_qp_security(qp, device);
1450                 if (ret)
1451                         goto err_cb;
1452
1453                 qp->real_qp       = qp;
1454                 qp->pd            = pd;
1455                 qp->send_cq       = attr.send_cq;
1456                 qp->recv_cq       = attr.recv_cq;
1457                 qp->srq           = attr.srq;
1458                 qp->rwq_ind_tbl   = ind_tbl;
1459                 qp->event_handler = attr.event_handler;
1460                 qp->qp_context    = attr.qp_context;
1461                 qp->qp_type       = attr.qp_type;
1462                 atomic_set(&qp->usecnt, 0);
1463                 atomic_inc(&pd->usecnt);
1464                 qp->port = 0;
1465                 if (attr.send_cq)
1466                         atomic_inc(&attr.send_cq->usecnt);
1467                 if (attr.recv_cq)
1468                         atomic_inc(&attr.recv_cq->usecnt);
1469                 if (attr.srq)
1470                         atomic_inc(&attr.srq->usecnt);
1471                 if (ind_tbl)
1472                         atomic_inc(&ind_tbl->usecnt);
1473         } else {
1474                 /* It is done in _ib_create_qp for other QP types */
1475                 qp->uobject = &obj->uevent.uobject;
1476         }
1477
1478         obj->uevent.uobject.object = qp;
1479
1480         memset(&resp, 0, sizeof resp);
1481         resp.base.qpn             = qp->qp_num;
1482         resp.base.qp_handle       = obj->uevent.uobject.id;
1483         resp.base.max_recv_sge    = attr.cap.max_recv_sge;
1484         resp.base.max_send_sge    = attr.cap.max_send_sge;
1485         resp.base.max_recv_wr     = attr.cap.max_recv_wr;
1486         resp.base.max_send_wr     = attr.cap.max_send_wr;
1487         resp.base.max_inline_data = attr.cap.max_inline_data;
1488         resp.response_length = uverbs_response_length(attrs, sizeof(resp));
1489
1490         ret = uverbs_response(attrs, &resp, sizeof(resp));
1491         if (ret)
1492                 goto err_cb;
1493
1494         if (xrcd) {
1495                 obj->uxrcd = container_of(xrcd_uobj, struct ib_uxrcd_object,
1496                                           uobject);
1497                 atomic_inc(&obj->uxrcd->refcnt);
1498                 uobj_put_read(xrcd_uobj);
1499         }
1500
1501         if (pd)
1502                 uobj_put_obj_read(pd);
1503         if (scq)
1504                 uobj_put_obj_read(scq);
1505         if (rcq && rcq != scq)
1506                 uobj_put_obj_read(rcq);
1507         if (srq)
1508                 uobj_put_obj_read(srq);
1509         if (ind_tbl)
1510                 uobj_put_obj_read(ind_tbl);
1511
1512         return uobj_alloc_commit(&obj->uevent.uobject);
1513 err_cb:
1514         ib_destroy_qp(qp);
1515
1516 err_put:
1517         if (!IS_ERR(xrcd_uobj))
1518                 uobj_put_read(xrcd_uobj);
1519         if (pd)
1520                 uobj_put_obj_read(pd);
1521         if (scq)
1522                 uobj_put_obj_read(scq);
1523         if (rcq && rcq != scq)
1524                 uobj_put_obj_read(rcq);
1525         if (srq)
1526                 uobj_put_obj_read(srq);
1527         if (ind_tbl)
1528                 uobj_put_obj_read(ind_tbl);
1529
1530         uobj_alloc_abort(&obj->uevent.uobject);
1531         return ret;
1532 }
1533
1534 static int ib_uverbs_create_qp(struct uverbs_attr_bundle *attrs)
1535 {
1536         struct ib_uverbs_create_qp      cmd;
1537         struct ib_uverbs_ex_create_qp   cmd_ex;
1538         int ret;
1539
1540         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1541         if (ret)
1542                 return ret;
1543
1544         memset(&cmd_ex, 0, sizeof(cmd_ex));
1545         cmd_ex.user_handle = cmd.user_handle;
1546         cmd_ex.pd_handle = cmd.pd_handle;
1547         cmd_ex.send_cq_handle = cmd.send_cq_handle;
1548         cmd_ex.recv_cq_handle = cmd.recv_cq_handle;
1549         cmd_ex.srq_handle = cmd.srq_handle;
1550         cmd_ex.max_send_wr = cmd.max_send_wr;
1551         cmd_ex.max_recv_wr = cmd.max_recv_wr;
1552         cmd_ex.max_send_sge = cmd.max_send_sge;
1553         cmd_ex.max_recv_sge = cmd.max_recv_sge;
1554         cmd_ex.max_inline_data = cmd.max_inline_data;
1555         cmd_ex.sq_sig_all = cmd.sq_sig_all;
1556         cmd_ex.qp_type = cmd.qp_type;
1557         cmd_ex.is_srq = cmd.is_srq;
1558
1559         return create_qp(attrs, &cmd_ex);
1560 }
1561
1562 static int ib_uverbs_ex_create_qp(struct uverbs_attr_bundle *attrs)
1563 {
1564         struct ib_uverbs_ex_create_qp cmd;
1565         int ret;
1566
1567         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1568         if (ret)
1569                 return ret;
1570
1571         if (cmd.comp_mask & ~IB_UVERBS_CREATE_QP_SUP_COMP_MASK)
1572                 return -EINVAL;
1573
1574         if (cmd.reserved)
1575                 return -EINVAL;
1576
1577         return create_qp(attrs, &cmd);
1578 }
1579
1580 static int ib_uverbs_open_qp(struct uverbs_attr_bundle *attrs)
1581 {
1582         struct ib_uverbs_open_qp        cmd;
1583         struct ib_uverbs_create_qp_resp resp;
1584         struct ib_uqp_object           *obj;
1585         struct ib_xrcd                 *xrcd;
1586         struct ib_uobject              *uninitialized_var(xrcd_uobj);
1587         struct ib_qp                   *qp;
1588         struct ib_qp_open_attr          attr;
1589         int ret;
1590         struct ib_device *ib_dev;
1591
1592         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1593         if (ret)
1594                 return ret;
1595
1596         obj = (struct ib_uqp_object *)uobj_alloc(UVERBS_OBJECT_QP, attrs,
1597                                                  &ib_dev);
1598         if (IS_ERR(obj))
1599                 return PTR_ERR(obj);
1600
1601         xrcd_uobj = uobj_get_read(UVERBS_OBJECT_XRCD, cmd.pd_handle, attrs);
1602         if (IS_ERR(xrcd_uobj)) {
1603                 ret = -EINVAL;
1604                 goto err_put;
1605         }
1606
1607         xrcd = (struct ib_xrcd *)xrcd_uobj->object;
1608         if (!xrcd) {
1609                 ret = -EINVAL;
1610                 goto err_xrcd;
1611         }
1612
1613         attr.event_handler = ib_uverbs_qp_event_handler;
1614         attr.qp_context    = attrs->ufile;
1615         attr.qp_num        = cmd.qpn;
1616         attr.qp_type       = cmd.qp_type;
1617
1618         obj->uevent.events_reported = 0;
1619         INIT_LIST_HEAD(&obj->uevent.event_list);
1620         INIT_LIST_HEAD(&obj->mcast_list);
1621
1622         qp = ib_open_qp(xrcd, &attr);
1623         if (IS_ERR(qp)) {
1624                 ret = PTR_ERR(qp);
1625                 goto err_xrcd;
1626         }
1627
1628         obj->uevent.uobject.object = qp;
1629         obj->uevent.uobject.user_handle = cmd.user_handle;
1630
1631         memset(&resp, 0, sizeof resp);
1632         resp.qpn       = qp->qp_num;
1633         resp.qp_handle = obj->uevent.uobject.id;
1634
1635         ret = uverbs_response(attrs, &resp, sizeof(resp));
1636         if (ret)
1637                 goto err_destroy;
1638
1639         obj->uxrcd = container_of(xrcd_uobj, struct ib_uxrcd_object, uobject);
1640         atomic_inc(&obj->uxrcd->refcnt);
1641         qp->uobject = &obj->uevent.uobject;
1642         uobj_put_read(xrcd_uobj);
1643
1644         return uobj_alloc_commit(&obj->uevent.uobject);
1645
1646 err_destroy:
1647         ib_destroy_qp(qp);
1648 err_xrcd:
1649         uobj_put_read(xrcd_uobj);
1650 err_put:
1651         uobj_alloc_abort(&obj->uevent.uobject);
1652         return ret;
1653 }
1654
1655 static void copy_ah_attr_to_uverbs(struct ib_uverbs_qp_dest *uverb_attr,
1656                                    struct rdma_ah_attr *rdma_attr)
1657 {
1658         const struct ib_global_route   *grh;
1659
1660         uverb_attr->dlid              = rdma_ah_get_dlid(rdma_attr);
1661         uverb_attr->sl                = rdma_ah_get_sl(rdma_attr);
1662         uverb_attr->src_path_bits     = rdma_ah_get_path_bits(rdma_attr);
1663         uverb_attr->static_rate       = rdma_ah_get_static_rate(rdma_attr);
1664         uverb_attr->is_global         = !!(rdma_ah_get_ah_flags(rdma_attr) &
1665                                          IB_AH_GRH);
1666         if (uverb_attr->is_global) {
1667                 grh = rdma_ah_read_grh(rdma_attr);
1668                 memcpy(uverb_attr->dgid, grh->dgid.raw, 16);
1669                 uverb_attr->flow_label        = grh->flow_label;
1670                 uverb_attr->sgid_index        = grh->sgid_index;
1671                 uverb_attr->hop_limit         = grh->hop_limit;
1672                 uverb_attr->traffic_class     = grh->traffic_class;
1673         }
1674         uverb_attr->port_num          = rdma_ah_get_port_num(rdma_attr);
1675 }
1676
1677 static int ib_uverbs_query_qp(struct uverbs_attr_bundle *attrs)
1678 {
1679         struct ib_uverbs_query_qp      cmd;
1680         struct ib_uverbs_query_qp_resp resp;
1681         struct ib_qp                   *qp;
1682         struct ib_qp_attr              *attr;
1683         struct ib_qp_init_attr         *init_attr;
1684         int                            ret;
1685
1686         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1687         if (ret)
1688                 return ret;
1689
1690         attr      = kmalloc(sizeof *attr, GFP_KERNEL);
1691         init_attr = kmalloc(sizeof *init_attr, GFP_KERNEL);
1692         if (!attr || !init_attr) {
1693                 ret = -ENOMEM;
1694                 goto out;
1695         }
1696
1697         qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
1698         if (!qp) {
1699                 ret = -EINVAL;
1700                 goto out;
1701         }
1702
1703         ret = ib_query_qp(qp, attr, cmd.attr_mask, init_attr);
1704
1705         uobj_put_obj_read(qp);
1706
1707         if (ret)
1708                 goto out;
1709
1710         memset(&resp, 0, sizeof resp);
1711
1712         resp.qp_state               = attr->qp_state;
1713         resp.cur_qp_state           = attr->cur_qp_state;
1714         resp.path_mtu               = attr->path_mtu;
1715         resp.path_mig_state         = attr->path_mig_state;
1716         resp.qkey                   = attr->qkey;
1717         resp.rq_psn                 = attr->rq_psn;
1718         resp.sq_psn                 = attr->sq_psn;
1719         resp.dest_qp_num            = attr->dest_qp_num;
1720         resp.qp_access_flags        = attr->qp_access_flags;
1721         resp.pkey_index             = attr->pkey_index;
1722         resp.alt_pkey_index         = attr->alt_pkey_index;
1723         resp.sq_draining            = attr->sq_draining;
1724         resp.max_rd_atomic          = attr->max_rd_atomic;
1725         resp.max_dest_rd_atomic     = attr->max_dest_rd_atomic;
1726         resp.min_rnr_timer          = attr->min_rnr_timer;
1727         resp.port_num               = attr->port_num;
1728         resp.timeout                = attr->timeout;
1729         resp.retry_cnt              = attr->retry_cnt;
1730         resp.rnr_retry              = attr->rnr_retry;
1731         resp.alt_port_num           = attr->alt_port_num;
1732         resp.alt_timeout            = attr->alt_timeout;
1733
1734         copy_ah_attr_to_uverbs(&resp.dest, &attr->ah_attr);
1735         copy_ah_attr_to_uverbs(&resp.alt_dest, &attr->alt_ah_attr);
1736
1737         resp.max_send_wr            = init_attr->cap.max_send_wr;
1738         resp.max_recv_wr            = init_attr->cap.max_recv_wr;
1739         resp.max_send_sge           = init_attr->cap.max_send_sge;
1740         resp.max_recv_sge           = init_attr->cap.max_recv_sge;
1741         resp.max_inline_data        = init_attr->cap.max_inline_data;
1742         resp.sq_sig_all             = init_attr->sq_sig_type == IB_SIGNAL_ALL_WR;
1743
1744         ret = uverbs_response(attrs, &resp, sizeof(resp));
1745
1746 out:
1747         kfree(attr);
1748         kfree(init_attr);
1749
1750         return ret;
1751 }
1752
1753 /* Remove ignored fields set in the attribute mask */
1754 static int modify_qp_mask(enum ib_qp_type qp_type, int mask)
1755 {
1756         switch (qp_type) {
1757         case IB_QPT_XRC_INI:
1758                 return mask & ~(IB_QP_MAX_DEST_RD_ATOMIC | IB_QP_MIN_RNR_TIMER);
1759         case IB_QPT_XRC_TGT:
1760                 return mask & ~(IB_QP_MAX_QP_RD_ATOMIC | IB_QP_RETRY_CNT |
1761                                 IB_QP_RNR_RETRY);
1762         default:
1763                 return mask;
1764         }
1765 }
1766
1767 static void copy_ah_attr_from_uverbs(struct ib_device *dev,
1768                                      struct rdma_ah_attr *rdma_attr,
1769                                      struct ib_uverbs_qp_dest *uverb_attr)
1770 {
1771         rdma_attr->type = rdma_ah_find_type(dev, uverb_attr->port_num);
1772         if (uverb_attr->is_global) {
1773                 rdma_ah_set_grh(rdma_attr, NULL,
1774                                 uverb_attr->flow_label,
1775                                 uverb_attr->sgid_index,
1776                                 uverb_attr->hop_limit,
1777                                 uverb_attr->traffic_class);
1778                 rdma_ah_set_dgid_raw(rdma_attr, uverb_attr->dgid);
1779         } else {
1780                 rdma_ah_set_ah_flags(rdma_attr, 0);
1781         }
1782         rdma_ah_set_dlid(rdma_attr, uverb_attr->dlid);
1783         rdma_ah_set_sl(rdma_attr, uverb_attr->sl);
1784         rdma_ah_set_path_bits(rdma_attr, uverb_attr->src_path_bits);
1785         rdma_ah_set_static_rate(rdma_attr, uverb_attr->static_rate);
1786         rdma_ah_set_port_num(rdma_attr, uverb_attr->port_num);
1787         rdma_ah_set_make_grd(rdma_attr, false);
1788 }
1789
1790 static int modify_qp(struct uverbs_attr_bundle *attrs,
1791                      struct ib_uverbs_ex_modify_qp *cmd)
1792 {
1793         struct ib_qp_attr *attr;
1794         struct ib_qp *qp;
1795         int ret;
1796
1797         attr = kzalloc(sizeof(*attr), GFP_KERNEL);
1798         if (!attr)
1799                 return -ENOMEM;
1800
1801         qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd->base.qp_handle,
1802                                attrs);
1803         if (!qp) {
1804                 ret = -EINVAL;
1805                 goto out;
1806         }
1807
1808         if ((cmd->base.attr_mask & IB_QP_PORT) &&
1809             !rdma_is_port_valid(qp->device, cmd->base.port_num)) {
1810                 ret = -EINVAL;
1811                 goto release_qp;
1812         }
1813
1814         if ((cmd->base.attr_mask & IB_QP_AV)) {
1815                 if (!rdma_is_port_valid(qp->device, cmd->base.dest.port_num)) {
1816                         ret = -EINVAL;
1817                         goto release_qp;
1818                 }
1819
1820                 if (cmd->base.attr_mask & IB_QP_STATE &&
1821                     cmd->base.qp_state == IB_QPS_RTR) {
1822                 /* We are in INIT->RTR TRANSITION (if we are not,
1823                  * this transition will be rejected in subsequent checks).
1824                  * In the INIT->RTR transition, we cannot have IB_QP_PORT set,
1825                  * but the IB_QP_STATE flag is required.
1826                  *
1827                  * Since kernel 3.14 (commit dbf727de7440), the uverbs driver,
1828                  * when IB_QP_AV is set, has required inclusion of a valid
1829                  * port number in the primary AV. (AVs are created and handled
1830                  * differently for infiniband and ethernet (RoCE) ports).
1831                  *
1832                  * Check the port number included in the primary AV against
1833                  * the port number in the qp struct, which was set (and saved)
1834                  * in the RST->INIT transition.
1835                  */
1836                         if (cmd->base.dest.port_num != qp->real_qp->port) {
1837                                 ret = -EINVAL;
1838                                 goto release_qp;
1839                         }
1840                 } else {
1841                 /* We are in SQD->SQD. (If we are not, this transition will
1842                  * be rejected later in the verbs layer checks).
1843                  * Check for both IB_QP_PORT and IB_QP_AV, these can be set
1844                  * together in the SQD->SQD transition.
1845                  *
1846                  * If only IP_QP_AV was set, add in IB_QP_PORT as well (the
1847                  * verbs layer driver does not track primary port changes
1848                  * resulting from path migration. Thus, in SQD, if the primary
1849                  * AV is modified, the primary port should also be modified).
1850                  *
1851                  * Note that in this transition, the IB_QP_STATE flag
1852                  * is not allowed.
1853                  */
1854                         if (((cmd->base.attr_mask & (IB_QP_AV | IB_QP_PORT))
1855                              == (IB_QP_AV | IB_QP_PORT)) &&
1856                             cmd->base.port_num != cmd->base.dest.port_num) {
1857                                 ret = -EINVAL;
1858                                 goto release_qp;
1859                         }
1860                         if ((cmd->base.attr_mask & (IB_QP_AV | IB_QP_PORT))
1861                             == IB_QP_AV) {
1862                                 cmd->base.attr_mask |= IB_QP_PORT;
1863                                 cmd->base.port_num = cmd->base.dest.port_num;
1864                         }
1865                 }
1866         }
1867
1868         if ((cmd->base.attr_mask & IB_QP_ALT_PATH) &&
1869             (!rdma_is_port_valid(qp->device, cmd->base.alt_port_num) ||
1870             !rdma_is_port_valid(qp->device, cmd->base.alt_dest.port_num) ||
1871             cmd->base.alt_port_num != cmd->base.alt_dest.port_num)) {
1872                 ret = -EINVAL;
1873                 goto release_qp;
1874         }
1875
1876         if ((cmd->base.attr_mask & IB_QP_CUR_STATE &&
1877             cmd->base.cur_qp_state > IB_QPS_ERR) ||
1878             (cmd->base.attr_mask & IB_QP_STATE &&
1879             cmd->base.qp_state > IB_QPS_ERR)) {
1880                 ret = -EINVAL;
1881                 goto release_qp;
1882         }
1883
1884         if (cmd->base.attr_mask & IB_QP_STATE)
1885                 attr->qp_state = cmd->base.qp_state;
1886         if (cmd->base.attr_mask & IB_QP_CUR_STATE)
1887                 attr->cur_qp_state = cmd->base.cur_qp_state;
1888         if (cmd->base.attr_mask & IB_QP_PATH_MTU)
1889                 attr->path_mtu = cmd->base.path_mtu;
1890         if (cmd->base.attr_mask & IB_QP_PATH_MIG_STATE)
1891                 attr->path_mig_state = cmd->base.path_mig_state;
1892         if (cmd->base.attr_mask & IB_QP_QKEY)
1893                 attr->qkey = cmd->base.qkey;
1894         if (cmd->base.attr_mask & IB_QP_RQ_PSN)
1895                 attr->rq_psn = cmd->base.rq_psn;
1896         if (cmd->base.attr_mask & IB_QP_SQ_PSN)
1897                 attr->sq_psn = cmd->base.sq_psn;
1898         if (cmd->base.attr_mask & IB_QP_DEST_QPN)
1899                 attr->dest_qp_num = cmd->base.dest_qp_num;
1900         if (cmd->base.attr_mask & IB_QP_ACCESS_FLAGS)
1901                 attr->qp_access_flags = cmd->base.qp_access_flags;
1902         if (cmd->base.attr_mask & IB_QP_PKEY_INDEX)
1903                 attr->pkey_index = cmd->base.pkey_index;
1904         if (cmd->base.attr_mask & IB_QP_EN_SQD_ASYNC_NOTIFY)
1905                 attr->en_sqd_async_notify = cmd->base.en_sqd_async_notify;
1906         if (cmd->base.attr_mask & IB_QP_MAX_QP_RD_ATOMIC)
1907                 attr->max_rd_atomic = cmd->base.max_rd_atomic;
1908         if (cmd->base.attr_mask & IB_QP_MAX_DEST_RD_ATOMIC)
1909                 attr->max_dest_rd_atomic = cmd->base.max_dest_rd_atomic;
1910         if (cmd->base.attr_mask & IB_QP_MIN_RNR_TIMER)
1911                 attr->min_rnr_timer = cmd->base.min_rnr_timer;
1912         if (cmd->base.attr_mask & IB_QP_PORT)
1913                 attr->port_num = cmd->base.port_num;
1914         if (cmd->base.attr_mask & IB_QP_TIMEOUT)
1915                 attr->timeout = cmd->base.timeout;
1916         if (cmd->base.attr_mask & IB_QP_RETRY_CNT)
1917                 attr->retry_cnt = cmd->base.retry_cnt;
1918         if (cmd->base.attr_mask & IB_QP_RNR_RETRY)
1919                 attr->rnr_retry = cmd->base.rnr_retry;
1920         if (cmd->base.attr_mask & IB_QP_ALT_PATH) {
1921                 attr->alt_port_num = cmd->base.alt_port_num;
1922                 attr->alt_timeout = cmd->base.alt_timeout;
1923                 attr->alt_pkey_index = cmd->base.alt_pkey_index;
1924         }
1925         if (cmd->base.attr_mask & IB_QP_RATE_LIMIT)
1926                 attr->rate_limit = cmd->rate_limit;
1927
1928         if (cmd->base.attr_mask & IB_QP_AV)
1929                 copy_ah_attr_from_uverbs(qp->device, &attr->ah_attr,
1930                                          &cmd->base.dest);
1931
1932         if (cmd->base.attr_mask & IB_QP_ALT_PATH)
1933                 copy_ah_attr_from_uverbs(qp->device, &attr->alt_ah_attr,
1934                                          &cmd->base.alt_dest);
1935
1936         ret = ib_modify_qp_with_udata(qp, attr,
1937                                       modify_qp_mask(qp->qp_type,
1938                                                      cmd->base.attr_mask),
1939                                       &attrs->driver_udata);
1940
1941 release_qp:
1942         uobj_put_obj_read(qp);
1943 out:
1944         kfree(attr);
1945
1946         return ret;
1947 }
1948
1949 static int ib_uverbs_modify_qp(struct uverbs_attr_bundle *attrs)
1950 {
1951         struct ib_uverbs_ex_modify_qp cmd;
1952         int ret;
1953
1954         ret = uverbs_request(attrs, &cmd.base, sizeof(cmd.base));
1955         if (ret)
1956                 return ret;
1957
1958         if (cmd.base.attr_mask &
1959             ~((IB_USER_LEGACY_LAST_QP_ATTR_MASK << 1) - 1))
1960                 return -EOPNOTSUPP;
1961
1962         return modify_qp(attrs, &cmd);
1963 }
1964
1965 static int ib_uverbs_ex_modify_qp(struct uverbs_attr_bundle *attrs)
1966 {
1967         struct ib_uverbs_ex_modify_qp cmd;
1968         struct ib_uverbs_ex_modify_qp_resp resp = {
1969                 .response_length = uverbs_response_length(attrs, sizeof(resp))
1970         };
1971         int ret;
1972
1973         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
1974         if (ret)
1975                 return ret;
1976
1977         /*
1978          * Last bit is reserved for extending the attr_mask by
1979          * using another field.
1980          */
1981         BUILD_BUG_ON(IB_USER_LAST_QP_ATTR_MASK == (1 << 31));
1982
1983         if (cmd.base.attr_mask &
1984             ~((IB_USER_LAST_QP_ATTR_MASK << 1) - 1))
1985                 return -EOPNOTSUPP;
1986
1987         ret = modify_qp(attrs, &cmd);
1988         if (ret)
1989                 return ret;
1990
1991         return uverbs_response(attrs, &resp, sizeof(resp));
1992 }
1993
1994 static int ib_uverbs_destroy_qp(struct uverbs_attr_bundle *attrs)
1995 {
1996         struct ib_uverbs_destroy_qp      cmd;
1997         struct ib_uverbs_destroy_qp_resp resp;
1998         struct ib_uobject               *uobj;
1999         struct ib_uqp_object            *obj;
2000         int ret;
2001
2002         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
2003         if (ret)
2004                 return ret;
2005
2006         uobj = uobj_get_destroy(UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
2007         if (IS_ERR(uobj))
2008                 return PTR_ERR(uobj);
2009
2010         obj = container_of(uobj, struct ib_uqp_object, uevent.uobject);
2011         memset(&resp, 0, sizeof(resp));
2012         resp.events_reported = obj->uevent.events_reported;
2013
2014         uobj_put_destroy(uobj);
2015
2016         return uverbs_response(attrs, &resp, sizeof(resp));
2017 }
2018
2019 static void *alloc_wr(size_t wr_size, __u32 num_sge)
2020 {
2021         if (num_sge >= (U32_MAX - ALIGN(wr_size, sizeof (struct ib_sge))) /
2022                        sizeof (struct ib_sge))
2023                 return NULL;
2024
2025         return kmalloc(ALIGN(wr_size, sizeof (struct ib_sge)) +
2026                          num_sge * sizeof (struct ib_sge), GFP_KERNEL);
2027 }
2028
2029 static int ib_uverbs_post_send(struct uverbs_attr_bundle *attrs)
2030 {
2031         struct ib_uverbs_post_send      cmd;
2032         struct ib_uverbs_post_send_resp resp;
2033         struct ib_uverbs_send_wr       *user_wr;
2034         struct ib_send_wr              *wr = NULL, *last, *next;
2035         const struct ib_send_wr        *bad_wr;
2036         struct ib_qp                   *qp;
2037         int                             i, sg_ind;
2038         int                             is_ud;
2039         int ret, ret2;
2040         size_t                          next_size;
2041         const struct ib_sge __user *sgls;
2042         const void __user *wqes;
2043         struct uverbs_req_iter iter;
2044
2045         ret = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd));
2046         if (ret)
2047                 return ret;
2048         wqes = uverbs_request_next_ptr(&iter, cmd.wqe_size * cmd.wr_count);
2049         if (IS_ERR(wqes))
2050                 return PTR_ERR(wqes);
2051         sgls = uverbs_request_next_ptr(
2052                 &iter, cmd.sge_count * sizeof(struct ib_uverbs_sge));
2053         if (IS_ERR(sgls))
2054                 return PTR_ERR(sgls);
2055         ret = uverbs_request_finish(&iter);
2056         if (ret)
2057                 return ret;
2058
2059         user_wr = kmalloc(cmd.wqe_size, GFP_KERNEL);
2060         if (!user_wr)
2061                 return -ENOMEM;
2062
2063         qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
2064         if (!qp)
2065                 goto out;
2066
2067         is_ud = qp->qp_type == IB_QPT_UD;
2068         sg_ind = 0;
2069         last = NULL;
2070         for (i = 0; i < cmd.wr_count; ++i) {
2071                 if (copy_from_user(user_wr, wqes + i * cmd.wqe_size,
2072                                    cmd.wqe_size)) {
2073                         ret = -EFAULT;
2074                         goto out_put;
2075                 }
2076
2077                 if (user_wr->num_sge + sg_ind > cmd.sge_count) {
2078                         ret = -EINVAL;
2079                         goto out_put;
2080                 }
2081
2082                 if (is_ud) {
2083                         struct ib_ud_wr *ud;
2084
2085                         if (user_wr->opcode != IB_WR_SEND &&
2086                             user_wr->opcode != IB_WR_SEND_WITH_IMM) {
2087                                 ret = -EINVAL;
2088                                 goto out_put;
2089                         }
2090
2091                         next_size = sizeof(*ud);
2092                         ud = alloc_wr(next_size, user_wr->num_sge);
2093                         if (!ud) {
2094                                 ret = -ENOMEM;
2095                                 goto out_put;
2096                         }
2097
2098                         ud->ah = uobj_get_obj_read(ah, UVERBS_OBJECT_AH,
2099                                                    user_wr->wr.ud.ah, attrs);
2100                         if (!ud->ah) {
2101                                 kfree(ud);
2102                                 ret = -EINVAL;
2103                                 goto out_put;
2104                         }
2105                         ud->remote_qpn = user_wr->wr.ud.remote_qpn;
2106                         ud->remote_qkey = user_wr->wr.ud.remote_qkey;
2107
2108                         next = &ud->wr;
2109                 } else if (user_wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM ||
2110                            user_wr->opcode == IB_WR_RDMA_WRITE ||
2111                            user_wr->opcode == IB_WR_RDMA_READ) {
2112                         struct ib_rdma_wr *rdma;
2113
2114                         next_size = sizeof(*rdma);
2115                         rdma = alloc_wr(next_size, user_wr->num_sge);
2116                         if (!rdma) {
2117                                 ret = -ENOMEM;
2118                                 goto out_put;
2119                         }
2120
2121                         rdma->remote_addr = user_wr->wr.rdma.remote_addr;
2122                         rdma->rkey = user_wr->wr.rdma.rkey;
2123
2124                         next = &rdma->wr;
2125                 } else if (user_wr->opcode == IB_WR_ATOMIC_CMP_AND_SWP ||
2126                            user_wr->opcode == IB_WR_ATOMIC_FETCH_AND_ADD) {
2127                         struct ib_atomic_wr *atomic;
2128
2129                         next_size = sizeof(*atomic);
2130                         atomic = alloc_wr(next_size, user_wr->num_sge);
2131                         if (!atomic) {
2132                                 ret = -ENOMEM;
2133                                 goto out_put;
2134                         }
2135
2136                         atomic->remote_addr = user_wr->wr.atomic.remote_addr;
2137                         atomic->compare_add = user_wr->wr.atomic.compare_add;
2138                         atomic->swap = user_wr->wr.atomic.swap;
2139                         atomic->rkey = user_wr->wr.atomic.rkey;
2140
2141                         next = &atomic->wr;
2142                 } else if (user_wr->opcode == IB_WR_SEND ||
2143                            user_wr->opcode == IB_WR_SEND_WITH_IMM ||
2144                            user_wr->opcode == IB_WR_SEND_WITH_INV) {
2145                         next_size = sizeof(*next);
2146                         next = alloc_wr(next_size, user_wr->num_sge);
2147                         if (!next) {
2148                                 ret = -ENOMEM;
2149                                 goto out_put;
2150                         }
2151                 } else {
2152                         ret = -EINVAL;
2153                         goto out_put;
2154                 }
2155
2156                 if (user_wr->opcode == IB_WR_SEND_WITH_IMM ||
2157                     user_wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM) {
2158                         next->ex.imm_data =
2159                                         (__be32 __force) user_wr->ex.imm_data;
2160                 } else if (user_wr->opcode == IB_WR_SEND_WITH_INV) {
2161                         next->ex.invalidate_rkey = user_wr->ex.invalidate_rkey;
2162                 }
2163
2164                 if (!last)
2165                         wr = next;
2166                 else
2167                         last->next = next;
2168                 last = next;
2169
2170                 next->next       = NULL;
2171                 next->wr_id      = user_wr->wr_id;
2172                 next->num_sge    = user_wr->num_sge;
2173                 next->opcode     = user_wr->opcode;
2174                 next->send_flags = user_wr->send_flags;
2175
2176                 if (next->num_sge) {
2177                         next->sg_list = (void *) next +
2178                                 ALIGN(next_size, sizeof(struct ib_sge));
2179                         if (copy_from_user(next->sg_list, sgls + sg_ind,
2180                                            next->num_sge *
2181                                                    sizeof(struct ib_sge))) {
2182                                 ret = -EFAULT;
2183                                 goto out_put;
2184                         }
2185                         sg_ind += next->num_sge;
2186                 } else
2187                         next->sg_list = NULL;
2188         }
2189
2190         resp.bad_wr = 0;
2191         ret = qp->device->post_send(qp->real_qp, wr, &bad_wr);
2192         if (ret)
2193                 for (next = wr; next; next = next->next) {
2194                         ++resp.bad_wr;
2195                         if (next == bad_wr)
2196                                 break;
2197                 }
2198
2199         ret2 = uverbs_response(attrs, &resp, sizeof(resp));
2200         if (ret2)
2201                 ret = ret2;
2202
2203 out_put:
2204         uobj_put_obj_read(qp);
2205
2206         while (wr) {
2207                 if (is_ud && ud_wr(wr)->ah)
2208                         uobj_put_obj_read(ud_wr(wr)->ah);
2209                 next = wr->next;
2210                 kfree(wr);
2211                 wr = next;
2212         }
2213
2214 out:
2215         kfree(user_wr);
2216
2217         return ret;
2218 }
2219
2220 static struct ib_recv_wr *
2221 ib_uverbs_unmarshall_recv(struct uverbs_req_iter *iter, u32 wr_count,
2222                           u32 wqe_size, u32 sge_count)
2223 {
2224         struct ib_uverbs_recv_wr *user_wr;
2225         struct ib_recv_wr        *wr = NULL, *last, *next;
2226         int                       sg_ind;
2227         int                       i;
2228         int                       ret;
2229         const struct ib_sge __user *sgls;
2230         const void __user *wqes;
2231
2232         if (wqe_size < sizeof (struct ib_uverbs_recv_wr))
2233                 return ERR_PTR(-EINVAL);
2234
2235         wqes = uverbs_request_next_ptr(iter, wqe_size * wr_count);
2236         if (IS_ERR(wqes))
2237                 return ERR_CAST(wqes);
2238         sgls = uverbs_request_next_ptr(
2239                 iter, sge_count * sizeof(struct ib_uverbs_sge));
2240         if (IS_ERR(sgls))
2241                 return ERR_CAST(sgls);
2242         ret = uverbs_request_finish(iter);
2243         if (ret)
2244                 return ERR_PTR(ret);
2245
2246         user_wr = kmalloc(wqe_size, GFP_KERNEL);
2247         if (!user_wr)
2248                 return ERR_PTR(-ENOMEM);
2249
2250         sg_ind = 0;
2251         last = NULL;
2252         for (i = 0; i < wr_count; ++i) {
2253                 if (copy_from_user(user_wr, wqes + i * wqe_size,
2254                                    wqe_size)) {
2255                         ret = -EFAULT;
2256                         goto err;
2257                 }
2258
2259                 if (user_wr->num_sge + sg_ind > sge_count) {
2260                         ret = -EINVAL;
2261                         goto err;
2262                 }
2263
2264                 if (user_wr->num_sge >=
2265                     (U32_MAX - ALIGN(sizeof *next, sizeof (struct ib_sge))) /
2266                     sizeof (struct ib_sge)) {
2267                         ret = -EINVAL;
2268                         goto err;
2269                 }
2270
2271                 next = kmalloc(ALIGN(sizeof *next, sizeof (struct ib_sge)) +
2272                                user_wr->num_sge * sizeof (struct ib_sge),
2273                                GFP_KERNEL);
2274                 if (!next) {
2275                         ret = -ENOMEM;
2276                         goto err;
2277                 }
2278
2279                 if (!last)
2280                         wr = next;
2281                 else
2282                         last->next = next;
2283                 last = next;
2284
2285                 next->next       = NULL;
2286                 next->wr_id      = user_wr->wr_id;
2287                 next->num_sge    = user_wr->num_sge;
2288
2289                 if (next->num_sge) {
2290                         next->sg_list = (void *) next +
2291                                 ALIGN(sizeof *next, sizeof (struct ib_sge));
2292                         if (copy_from_user(next->sg_list, sgls + sg_ind,
2293                                            next->num_sge *
2294                                                    sizeof(struct ib_sge))) {
2295                                 ret = -EFAULT;
2296                                 goto err;
2297                         }
2298                         sg_ind += next->num_sge;
2299                 } else
2300                         next->sg_list = NULL;
2301         }
2302
2303         kfree(user_wr);
2304         return wr;
2305
2306 err:
2307         kfree(user_wr);
2308
2309         while (wr) {
2310                 next = wr->next;
2311                 kfree(wr);
2312                 wr = next;
2313         }
2314
2315         return ERR_PTR(ret);
2316 }
2317
2318 static int ib_uverbs_post_recv(struct uverbs_attr_bundle *attrs)
2319 {
2320         struct ib_uverbs_post_recv      cmd;
2321         struct ib_uverbs_post_recv_resp resp;
2322         struct ib_recv_wr              *wr, *next;
2323         const struct ib_recv_wr        *bad_wr;
2324         struct ib_qp                   *qp;
2325         int ret, ret2;
2326         struct uverbs_req_iter iter;
2327
2328         ret = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd));
2329         if (ret)
2330                 return ret;
2331
2332         wr = ib_uverbs_unmarshall_recv(&iter, cmd.wr_count, cmd.wqe_size,
2333                                        cmd.sge_count);
2334         if (IS_ERR(wr))
2335                 return PTR_ERR(wr);
2336
2337         qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
2338         if (!qp) {
2339                 ret = -EINVAL;
2340                 goto out;
2341         }
2342
2343         resp.bad_wr = 0;
2344         ret = qp->device->post_recv(qp->real_qp, wr, &bad_wr);
2345
2346         uobj_put_obj_read(qp);
2347         if (ret) {
2348                 for (next = wr; next; next = next->next) {
2349                         ++resp.bad_wr;
2350                         if (next == bad_wr)
2351                                 break;
2352                 }
2353         }
2354
2355         ret2 = uverbs_response(attrs, &resp, sizeof(resp));
2356         if (ret2)
2357                 ret = ret2;
2358 out:
2359         while (wr) {
2360                 next = wr->next;
2361                 kfree(wr);
2362                 wr = next;
2363         }
2364
2365         return ret;
2366 }
2367
2368 static int ib_uverbs_post_srq_recv(struct uverbs_attr_bundle *attrs)
2369 {
2370         struct ib_uverbs_post_srq_recv      cmd;
2371         struct ib_uverbs_post_srq_recv_resp resp;
2372         struct ib_recv_wr                  *wr, *next;
2373         const struct ib_recv_wr            *bad_wr;
2374         struct ib_srq                      *srq;
2375         int ret, ret2;
2376         struct uverbs_req_iter iter;
2377
2378         ret = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd));
2379         if (ret)
2380                 return ret;
2381
2382         wr = ib_uverbs_unmarshall_recv(&iter, cmd.wr_count, cmd.wqe_size,
2383                                        cmd.sge_count);
2384         if (IS_ERR(wr))
2385                 return PTR_ERR(wr);
2386
2387         srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs);
2388         if (!srq) {
2389                 ret = -EINVAL;
2390                 goto out;
2391         }
2392
2393         resp.bad_wr = 0;
2394         ret = srq->device->post_srq_recv(srq, wr, &bad_wr);
2395
2396         uobj_put_obj_read(srq);
2397
2398         if (ret)
2399                 for (next = wr; next; next = next->next) {
2400                         ++resp.bad_wr;
2401                         if (next == bad_wr)
2402                                 break;
2403                 }
2404
2405         ret2 = uverbs_response(attrs, &resp, sizeof(resp));
2406         if (ret2)
2407                 ret = ret2;
2408
2409 out:
2410         while (wr) {
2411                 next = wr->next;
2412                 kfree(wr);
2413                 wr = next;
2414         }
2415
2416         return ret;
2417 }
2418
2419 static int ib_uverbs_create_ah(struct uverbs_attr_bundle *attrs)
2420 {
2421         struct ib_uverbs_create_ah       cmd;
2422         struct ib_uverbs_create_ah_resp  resp;
2423         struct ib_uobject               *uobj;
2424         struct ib_pd                    *pd;
2425         struct ib_ah                    *ah;
2426         struct rdma_ah_attr             attr = {};
2427         int ret;
2428         struct ib_device *ib_dev;
2429
2430         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
2431         if (ret)
2432                 return ret;
2433
2434         uobj = uobj_alloc(UVERBS_OBJECT_AH, attrs, &ib_dev);
2435         if (IS_ERR(uobj))
2436                 return PTR_ERR(uobj);
2437
2438         if (!rdma_is_port_valid(ib_dev, cmd.attr.port_num)) {
2439                 ret = -EINVAL;
2440                 goto err;
2441         }
2442
2443         pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs);
2444         if (!pd) {
2445                 ret = -EINVAL;
2446                 goto err;
2447         }
2448
2449         attr.type = rdma_ah_find_type(ib_dev, cmd.attr.port_num);
2450         rdma_ah_set_make_grd(&attr, false);
2451         rdma_ah_set_dlid(&attr, cmd.attr.dlid);
2452         rdma_ah_set_sl(&attr, cmd.attr.sl);
2453         rdma_ah_set_path_bits(&attr, cmd.attr.src_path_bits);
2454         rdma_ah_set_static_rate(&attr, cmd.attr.static_rate);
2455         rdma_ah_set_port_num(&attr, cmd.attr.port_num);
2456
2457         if (cmd.attr.is_global) {
2458                 rdma_ah_set_grh(&attr, NULL, cmd.attr.grh.flow_label,
2459                                 cmd.attr.grh.sgid_index,
2460                                 cmd.attr.grh.hop_limit,
2461                                 cmd.attr.grh.traffic_class);
2462                 rdma_ah_set_dgid_raw(&attr, cmd.attr.grh.dgid);
2463         } else {
2464                 rdma_ah_set_ah_flags(&attr, 0);
2465         }
2466
2467         ah = rdma_create_user_ah(pd, &attr, &attrs->driver_udata);
2468         if (IS_ERR(ah)) {
2469                 ret = PTR_ERR(ah);
2470                 goto err_put;
2471         }
2472
2473         ah->uobject  = uobj;
2474         uobj->user_handle = cmd.user_handle;
2475         uobj->object = ah;
2476
2477         resp.ah_handle = uobj->id;
2478
2479         ret = uverbs_response(attrs, &resp, sizeof(resp));
2480         if (ret)
2481                 goto err_copy;
2482
2483         uobj_put_obj_read(pd);
2484         return uobj_alloc_commit(uobj);
2485
2486 err_copy:
2487         rdma_destroy_ah(ah);
2488
2489 err_put:
2490         uobj_put_obj_read(pd);
2491
2492 err:
2493         uobj_alloc_abort(uobj);
2494         return ret;
2495 }
2496
2497 static int ib_uverbs_destroy_ah(struct uverbs_attr_bundle *attrs)
2498 {
2499         struct ib_uverbs_destroy_ah cmd;
2500         int ret;
2501
2502         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
2503         if (ret)
2504                 return ret;
2505
2506         return uobj_perform_destroy(UVERBS_OBJECT_AH, cmd.ah_handle, attrs);
2507 }
2508
2509 static int ib_uverbs_attach_mcast(struct uverbs_attr_bundle *attrs)
2510 {
2511         struct ib_uverbs_attach_mcast cmd;
2512         struct ib_qp                 *qp;
2513         struct ib_uqp_object         *obj;
2514         struct ib_uverbs_mcast_entry *mcast;
2515         int                           ret;
2516
2517         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
2518         if (ret)
2519                 return ret;
2520
2521         qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
2522         if (!qp)
2523                 return -EINVAL;
2524
2525         obj = container_of(qp->uobject, struct ib_uqp_object, uevent.uobject);
2526
2527         mutex_lock(&obj->mcast_lock);
2528         list_for_each_entry(mcast, &obj->mcast_list, list)
2529                 if (cmd.mlid == mcast->lid &&
2530                     !memcmp(cmd.gid, mcast->gid.raw, sizeof mcast->gid.raw)) {
2531                         ret = 0;
2532                         goto out_put;
2533                 }
2534
2535         mcast = kmalloc(sizeof *mcast, GFP_KERNEL);
2536         if (!mcast) {
2537                 ret = -ENOMEM;
2538                 goto out_put;
2539         }
2540
2541         mcast->lid = cmd.mlid;
2542         memcpy(mcast->gid.raw, cmd.gid, sizeof mcast->gid.raw);
2543
2544         ret = ib_attach_mcast(qp, &mcast->gid, cmd.mlid);
2545         if (!ret)
2546                 list_add_tail(&mcast->list, &obj->mcast_list);
2547         else
2548                 kfree(mcast);
2549
2550 out_put:
2551         mutex_unlock(&obj->mcast_lock);
2552         uobj_put_obj_read(qp);
2553
2554         return ret;
2555 }
2556
2557 static int ib_uverbs_detach_mcast(struct uverbs_attr_bundle *attrs)
2558 {
2559         struct ib_uverbs_detach_mcast cmd;
2560         struct ib_uqp_object         *obj;
2561         struct ib_qp                 *qp;
2562         struct ib_uverbs_mcast_entry *mcast;
2563         int                           ret = -EINVAL;
2564         bool                          found = false;
2565
2566         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
2567         if (ret)
2568                 return ret;
2569
2570         qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
2571         if (!qp)
2572                 return -EINVAL;
2573
2574         obj = container_of(qp->uobject, struct ib_uqp_object, uevent.uobject);
2575         mutex_lock(&obj->mcast_lock);
2576
2577         list_for_each_entry(mcast, &obj->mcast_list, list)
2578                 if (cmd.mlid == mcast->lid &&
2579                     !memcmp(cmd.gid, mcast->gid.raw, sizeof mcast->gid.raw)) {
2580                         list_del(&mcast->list);
2581                         kfree(mcast);
2582                         found = true;
2583                         break;
2584                 }
2585
2586         if (!found) {
2587                 ret = -EINVAL;
2588                 goto out_put;
2589         }
2590
2591         ret = ib_detach_mcast(qp, (union ib_gid *)cmd.gid, cmd.mlid);
2592
2593 out_put:
2594         mutex_unlock(&obj->mcast_lock);
2595         uobj_put_obj_read(qp);
2596         return ret;
2597 }
2598
2599 struct ib_uflow_resources *flow_resources_alloc(size_t num_specs)
2600 {
2601         struct ib_uflow_resources *resources;
2602
2603         resources = kzalloc(sizeof(*resources), GFP_KERNEL);
2604
2605         if (!resources)
2606                 return NULL;
2607
2608         if (!num_specs)
2609                 goto out;
2610
2611         resources->counters =
2612                 kcalloc(num_specs, sizeof(*resources->counters), GFP_KERNEL);
2613         resources->collection =
2614                 kcalloc(num_specs, sizeof(*resources->collection), GFP_KERNEL);
2615
2616         if (!resources->counters || !resources->collection)
2617                 goto err;
2618
2619 out:
2620         resources->max = num_specs;
2621         return resources;
2622
2623 err:
2624         kfree(resources->counters);
2625         kfree(resources);
2626
2627         return NULL;
2628 }
2629 EXPORT_SYMBOL(flow_resources_alloc);
2630
2631 void ib_uverbs_flow_resources_free(struct ib_uflow_resources *uflow_res)
2632 {
2633         unsigned int i;
2634
2635         if (!uflow_res)
2636                 return;
2637
2638         for (i = 0; i < uflow_res->collection_num; i++)
2639                 atomic_dec(&uflow_res->collection[i]->usecnt);
2640
2641         for (i = 0; i < uflow_res->counters_num; i++)
2642                 atomic_dec(&uflow_res->counters[i]->usecnt);
2643
2644         kfree(uflow_res->collection);
2645         kfree(uflow_res->counters);
2646         kfree(uflow_res);
2647 }
2648 EXPORT_SYMBOL(ib_uverbs_flow_resources_free);
2649
2650 void flow_resources_add(struct ib_uflow_resources *uflow_res,
2651                         enum ib_flow_spec_type type,
2652                         void *ibobj)
2653 {
2654         WARN_ON(uflow_res->num >= uflow_res->max);
2655
2656         switch (type) {
2657         case IB_FLOW_SPEC_ACTION_HANDLE:
2658                 atomic_inc(&((struct ib_flow_action *)ibobj)->usecnt);
2659                 uflow_res->collection[uflow_res->collection_num++] =
2660                         (struct ib_flow_action *)ibobj;
2661                 break;
2662         case IB_FLOW_SPEC_ACTION_COUNT:
2663                 atomic_inc(&((struct ib_counters *)ibobj)->usecnt);
2664                 uflow_res->counters[uflow_res->counters_num++] =
2665                         (struct ib_counters *)ibobj;
2666                 break;
2667         default:
2668                 WARN_ON(1);
2669         }
2670
2671         uflow_res->num++;
2672 }
2673 EXPORT_SYMBOL(flow_resources_add);
2674
2675 static int kern_spec_to_ib_spec_action(const struct uverbs_attr_bundle *attrs,
2676                                        struct ib_uverbs_flow_spec *kern_spec,
2677                                        union ib_flow_spec *ib_spec,
2678                                        struct ib_uflow_resources *uflow_res)
2679 {
2680         ib_spec->type = kern_spec->type;
2681         switch (ib_spec->type) {
2682         case IB_FLOW_SPEC_ACTION_TAG:
2683                 if (kern_spec->flow_tag.size !=
2684                     sizeof(struct ib_uverbs_flow_spec_action_tag))
2685                         return -EINVAL;
2686
2687                 ib_spec->flow_tag.size = sizeof(struct ib_flow_spec_action_tag);
2688                 ib_spec->flow_tag.tag_id = kern_spec->flow_tag.tag_id;
2689                 break;
2690         case IB_FLOW_SPEC_ACTION_DROP:
2691                 if (kern_spec->drop.size !=
2692                     sizeof(struct ib_uverbs_flow_spec_action_drop))
2693                         return -EINVAL;
2694
2695                 ib_spec->drop.size = sizeof(struct ib_flow_spec_action_drop);
2696                 break;
2697         case IB_FLOW_SPEC_ACTION_HANDLE:
2698                 if (kern_spec->action.size !=
2699                     sizeof(struct ib_uverbs_flow_spec_action_handle))
2700                         return -EOPNOTSUPP;
2701                 ib_spec->action.act = uobj_get_obj_read(flow_action,
2702                                                         UVERBS_OBJECT_FLOW_ACTION,
2703                                                         kern_spec->action.handle,
2704                                                         attrs);
2705                 if (!ib_spec->action.act)
2706                         return -EINVAL;
2707                 ib_spec->action.size =
2708                         sizeof(struct ib_flow_spec_action_handle);
2709                 flow_resources_add(uflow_res,
2710                                    IB_FLOW_SPEC_ACTION_HANDLE,
2711                                    ib_spec->action.act);
2712                 uobj_put_obj_read(ib_spec->action.act);
2713                 break;
2714         case IB_FLOW_SPEC_ACTION_COUNT:
2715                 if (kern_spec->flow_count.size !=
2716                         sizeof(struct ib_uverbs_flow_spec_action_count))
2717                         return -EINVAL;
2718                 ib_spec->flow_count.counters =
2719                         uobj_get_obj_read(counters,
2720                                           UVERBS_OBJECT_COUNTERS,
2721                                           kern_spec->flow_count.handle,
2722                                           attrs);
2723                 if (!ib_spec->flow_count.counters)
2724                         return -EINVAL;
2725                 ib_spec->flow_count.size =
2726                                 sizeof(struct ib_flow_spec_action_count);
2727                 flow_resources_add(uflow_res,
2728                                    IB_FLOW_SPEC_ACTION_COUNT,
2729                                    ib_spec->flow_count.counters);
2730                 uobj_put_obj_read(ib_spec->flow_count.counters);
2731                 break;
2732         default:
2733                 return -EINVAL;
2734         }
2735         return 0;
2736 }
2737
2738 static size_t kern_spec_filter_sz(const struct ib_uverbs_flow_spec_hdr *spec)
2739 {
2740         /* Returns user space filter size, includes padding */
2741         return (spec->size - sizeof(struct ib_uverbs_flow_spec_hdr)) / 2;
2742 }
2743
2744 static ssize_t spec_filter_size(const void *kern_spec_filter, u16 kern_filter_size,
2745                                 u16 ib_real_filter_sz)
2746 {
2747         /*
2748          * User space filter structures must be 64 bit aligned, otherwise this
2749          * may pass, but we won't handle additional new attributes.
2750          */
2751
2752         if (kern_filter_size > ib_real_filter_sz) {
2753                 if (memchr_inv(kern_spec_filter +
2754                                ib_real_filter_sz, 0,
2755                                kern_filter_size - ib_real_filter_sz))
2756                         return -EINVAL;
2757                 return ib_real_filter_sz;
2758         }
2759         return kern_filter_size;
2760 }
2761
2762 int ib_uverbs_kern_spec_to_ib_spec_filter(enum ib_flow_spec_type type,
2763                                           const void *kern_spec_mask,
2764                                           const void *kern_spec_val,
2765                                           size_t kern_filter_sz,
2766                                           union ib_flow_spec *ib_spec)
2767 {
2768         ssize_t actual_filter_sz;
2769         ssize_t ib_filter_sz;
2770
2771         /* User flow spec size must be aligned to 4 bytes */
2772         if (kern_filter_sz != ALIGN(kern_filter_sz, 4))
2773                 return -EINVAL;
2774
2775         ib_spec->type = type;
2776
2777         if (ib_spec->type == (IB_FLOW_SPEC_INNER | IB_FLOW_SPEC_VXLAN_TUNNEL))
2778                 return -EINVAL;
2779
2780         switch (ib_spec->type & ~IB_FLOW_SPEC_INNER) {
2781         case IB_FLOW_SPEC_ETH:
2782                 ib_filter_sz = offsetof(struct ib_flow_eth_filter, real_sz);
2783                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2784                                                     kern_filter_sz,
2785                                                     ib_filter_sz);
2786                 if (actual_filter_sz <= 0)
2787                         return -EINVAL;
2788                 ib_spec->size = sizeof(struct ib_flow_spec_eth);
2789                 memcpy(&ib_spec->eth.val, kern_spec_val, actual_filter_sz);
2790                 memcpy(&ib_spec->eth.mask, kern_spec_mask, actual_filter_sz);
2791                 break;
2792         case IB_FLOW_SPEC_IPV4:
2793                 ib_filter_sz = offsetof(struct ib_flow_ipv4_filter, real_sz);
2794                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2795                                                     kern_filter_sz,
2796                                                     ib_filter_sz);
2797                 if (actual_filter_sz <= 0)
2798                         return -EINVAL;
2799                 ib_spec->size = sizeof(struct ib_flow_spec_ipv4);
2800                 memcpy(&ib_spec->ipv4.val, kern_spec_val, actual_filter_sz);
2801                 memcpy(&ib_spec->ipv4.mask, kern_spec_mask, actual_filter_sz);
2802                 break;
2803         case IB_FLOW_SPEC_IPV6:
2804                 ib_filter_sz = offsetof(struct ib_flow_ipv6_filter, real_sz);
2805                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2806                                                     kern_filter_sz,
2807                                                     ib_filter_sz);
2808                 if (actual_filter_sz <= 0)
2809                         return -EINVAL;
2810                 ib_spec->size = sizeof(struct ib_flow_spec_ipv6);
2811                 memcpy(&ib_spec->ipv6.val, kern_spec_val, actual_filter_sz);
2812                 memcpy(&ib_spec->ipv6.mask, kern_spec_mask, actual_filter_sz);
2813
2814                 if ((ntohl(ib_spec->ipv6.mask.flow_label)) >= BIT(20) ||
2815                     (ntohl(ib_spec->ipv6.val.flow_label)) >= BIT(20))
2816                         return -EINVAL;
2817                 break;
2818         case IB_FLOW_SPEC_TCP:
2819         case IB_FLOW_SPEC_UDP:
2820                 ib_filter_sz = offsetof(struct ib_flow_tcp_udp_filter, real_sz);
2821                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2822                                                     kern_filter_sz,
2823                                                     ib_filter_sz);
2824                 if (actual_filter_sz <= 0)
2825                         return -EINVAL;
2826                 ib_spec->size = sizeof(struct ib_flow_spec_tcp_udp);
2827                 memcpy(&ib_spec->tcp_udp.val, kern_spec_val, actual_filter_sz);
2828                 memcpy(&ib_spec->tcp_udp.mask, kern_spec_mask, actual_filter_sz);
2829                 break;
2830         case IB_FLOW_SPEC_VXLAN_TUNNEL:
2831                 ib_filter_sz = offsetof(struct ib_flow_tunnel_filter, real_sz);
2832                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2833                                                     kern_filter_sz,
2834                                                     ib_filter_sz);
2835                 if (actual_filter_sz <= 0)
2836                         return -EINVAL;
2837                 ib_spec->tunnel.size = sizeof(struct ib_flow_spec_tunnel);
2838                 memcpy(&ib_spec->tunnel.val, kern_spec_val, actual_filter_sz);
2839                 memcpy(&ib_spec->tunnel.mask, kern_spec_mask, actual_filter_sz);
2840
2841                 if ((ntohl(ib_spec->tunnel.mask.tunnel_id)) >= BIT(24) ||
2842                     (ntohl(ib_spec->tunnel.val.tunnel_id)) >= BIT(24))
2843                         return -EINVAL;
2844                 break;
2845         case IB_FLOW_SPEC_ESP:
2846                 ib_filter_sz = offsetof(struct ib_flow_esp_filter, real_sz);
2847                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2848                                                     kern_filter_sz,
2849                                                     ib_filter_sz);
2850                 if (actual_filter_sz <= 0)
2851                         return -EINVAL;
2852                 ib_spec->esp.size = sizeof(struct ib_flow_spec_esp);
2853                 memcpy(&ib_spec->esp.val, kern_spec_val, actual_filter_sz);
2854                 memcpy(&ib_spec->esp.mask, kern_spec_mask, actual_filter_sz);
2855                 break;
2856         case IB_FLOW_SPEC_GRE:
2857                 ib_filter_sz = offsetof(struct ib_flow_gre_filter, real_sz);
2858                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2859                                                     kern_filter_sz,
2860                                                     ib_filter_sz);
2861                 if (actual_filter_sz <= 0)
2862                         return -EINVAL;
2863                 ib_spec->gre.size = sizeof(struct ib_flow_spec_gre);
2864                 memcpy(&ib_spec->gre.val, kern_spec_val, actual_filter_sz);
2865                 memcpy(&ib_spec->gre.mask, kern_spec_mask, actual_filter_sz);
2866                 break;
2867         case IB_FLOW_SPEC_MPLS:
2868                 ib_filter_sz = offsetof(struct ib_flow_mpls_filter, real_sz);
2869                 actual_filter_sz = spec_filter_size(kern_spec_mask,
2870                                                     kern_filter_sz,
2871                                                     ib_filter_sz);
2872                 if (actual_filter_sz <= 0)
2873                         return -EINVAL;
2874                 ib_spec->mpls.size = sizeof(struct ib_flow_spec_mpls);
2875                 memcpy(&ib_spec->mpls.val, kern_spec_val, actual_filter_sz);
2876                 memcpy(&ib_spec->mpls.mask, kern_spec_mask, actual_filter_sz);
2877                 break;
2878         default:
2879                 return -EINVAL;
2880         }
2881         return 0;
2882 }
2883
2884 static int kern_spec_to_ib_spec_filter(struct ib_uverbs_flow_spec *kern_spec,
2885                                        union ib_flow_spec *ib_spec)
2886 {
2887         ssize_t kern_filter_sz;
2888         void *kern_spec_mask;
2889         void *kern_spec_val;
2890
2891         kern_filter_sz = kern_spec_filter_sz(&kern_spec->hdr);
2892
2893         kern_spec_val = (void *)kern_spec +
2894                 sizeof(struct ib_uverbs_flow_spec_hdr);
2895         kern_spec_mask = kern_spec_val + kern_filter_sz;
2896
2897         return ib_uverbs_kern_spec_to_ib_spec_filter(kern_spec->type,
2898                                                      kern_spec_mask,
2899                                                      kern_spec_val,
2900                                                      kern_filter_sz, ib_spec);
2901 }
2902
2903 static int kern_spec_to_ib_spec(struct uverbs_attr_bundle *attrs,
2904                                 struct ib_uverbs_flow_spec *kern_spec,
2905                                 union ib_flow_spec *ib_spec,
2906                                 struct ib_uflow_resources *uflow_res)
2907 {
2908         if (kern_spec->reserved)
2909                 return -EINVAL;
2910
2911         if (kern_spec->type >= IB_FLOW_SPEC_ACTION_TAG)
2912                 return kern_spec_to_ib_spec_action(attrs, kern_spec, ib_spec,
2913                                                    uflow_res);
2914         else
2915                 return kern_spec_to_ib_spec_filter(kern_spec, ib_spec);
2916 }
2917
2918 static int ib_uverbs_ex_create_wq(struct uverbs_attr_bundle *attrs)
2919 {
2920         struct ib_uverbs_ex_create_wq cmd;
2921         struct ib_uverbs_ex_create_wq_resp resp = {};
2922         struct ib_uwq_object           *obj;
2923         int err = 0;
2924         struct ib_cq *cq;
2925         struct ib_pd *pd;
2926         struct ib_wq *wq;
2927         struct ib_wq_init_attr wq_init_attr = {};
2928         struct ib_device *ib_dev;
2929
2930         err = uverbs_request(attrs, &cmd, sizeof(cmd));
2931         if (err)
2932                 return err;
2933
2934         if (cmd.comp_mask)
2935                 return -EOPNOTSUPP;
2936
2937         obj = (struct ib_uwq_object *)uobj_alloc(UVERBS_OBJECT_WQ, attrs,
2938                                                  &ib_dev);
2939         if (IS_ERR(obj))
2940                 return PTR_ERR(obj);
2941
2942         pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs);
2943         if (!pd) {
2944                 err = -EINVAL;
2945                 goto err_uobj;
2946         }
2947
2948         cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs);
2949         if (!cq) {
2950                 err = -EINVAL;
2951                 goto err_put_pd;
2952         }
2953
2954         wq_init_attr.cq = cq;
2955         wq_init_attr.max_sge = cmd.max_sge;
2956         wq_init_attr.max_wr = cmd.max_wr;
2957         wq_init_attr.wq_context = attrs->ufile;
2958         wq_init_attr.wq_type = cmd.wq_type;
2959         wq_init_attr.event_handler = ib_uverbs_wq_event_handler;
2960         wq_init_attr.create_flags = cmd.create_flags;
2961         obj->uevent.events_reported = 0;
2962         INIT_LIST_HEAD(&obj->uevent.event_list);
2963
2964         wq = pd->device->create_wq(pd, &wq_init_attr, &attrs->driver_udata);
2965         if (IS_ERR(wq)) {
2966                 err = PTR_ERR(wq);
2967                 goto err_put_cq;
2968         }
2969
2970         wq->uobject = &obj->uevent.uobject;
2971         obj->uevent.uobject.object = wq;
2972         wq->wq_type = wq_init_attr.wq_type;
2973         wq->cq = cq;
2974         wq->pd = pd;
2975         wq->device = pd->device;
2976         wq->wq_context = wq_init_attr.wq_context;
2977         atomic_set(&wq->usecnt, 0);
2978         atomic_inc(&pd->usecnt);
2979         atomic_inc(&cq->usecnt);
2980         wq->uobject = &obj->uevent.uobject;
2981         obj->uevent.uobject.object = wq;
2982
2983         memset(&resp, 0, sizeof(resp));
2984         resp.wq_handle = obj->uevent.uobject.id;
2985         resp.max_sge = wq_init_attr.max_sge;
2986         resp.max_wr = wq_init_attr.max_wr;
2987         resp.wqn = wq->wq_num;
2988         resp.response_length = uverbs_response_length(attrs, sizeof(resp));
2989         err = uverbs_response(attrs, &resp, sizeof(resp));
2990         if (err)
2991                 goto err_copy;
2992
2993         uobj_put_obj_read(pd);
2994         uobj_put_obj_read(cq);
2995         return uobj_alloc_commit(&obj->uevent.uobject);
2996
2997 err_copy:
2998         ib_destroy_wq(wq);
2999 err_put_cq:
3000         uobj_put_obj_read(cq);
3001 err_put_pd:
3002         uobj_put_obj_read(pd);
3003 err_uobj:
3004         uobj_alloc_abort(&obj->uevent.uobject);
3005
3006         return err;
3007 }
3008
3009 static int ib_uverbs_ex_destroy_wq(struct uverbs_attr_bundle *attrs)
3010 {
3011         struct ib_uverbs_ex_destroy_wq  cmd;
3012         struct ib_uverbs_ex_destroy_wq_resp     resp = {};
3013         struct ib_uobject               *uobj;
3014         struct ib_uwq_object            *obj;
3015         int                             ret;
3016
3017         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3018         if (ret)
3019                 return ret;
3020
3021         if (cmd.comp_mask)
3022                 return -EOPNOTSUPP;
3023
3024         resp.response_length = uverbs_response_length(attrs, sizeof(resp));
3025         uobj = uobj_get_destroy(UVERBS_OBJECT_WQ, cmd.wq_handle, attrs);
3026         if (IS_ERR(uobj))
3027                 return PTR_ERR(uobj);
3028
3029         obj = container_of(uobj, struct ib_uwq_object, uevent.uobject);
3030         resp.events_reported = obj->uevent.events_reported;
3031
3032         uobj_put_destroy(uobj);
3033
3034         return uverbs_response(attrs, &resp, sizeof(resp));
3035 }
3036
3037 static int ib_uverbs_ex_modify_wq(struct uverbs_attr_bundle *attrs)
3038 {
3039         struct ib_uverbs_ex_modify_wq cmd;
3040         struct ib_wq *wq;
3041         struct ib_wq_attr wq_attr = {};
3042         int ret;
3043
3044         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3045         if (ret)
3046                 return ret;
3047
3048         if (!cmd.attr_mask)
3049                 return -EINVAL;
3050
3051         if (cmd.attr_mask > (IB_WQ_STATE | IB_WQ_CUR_STATE | IB_WQ_FLAGS))
3052                 return -EINVAL;
3053
3054         wq = uobj_get_obj_read(wq, UVERBS_OBJECT_WQ, cmd.wq_handle, attrs);
3055         if (!wq)
3056                 return -EINVAL;
3057
3058         wq_attr.curr_wq_state = cmd.curr_wq_state;
3059         wq_attr.wq_state = cmd.wq_state;
3060         if (cmd.attr_mask & IB_WQ_FLAGS) {
3061                 wq_attr.flags = cmd.flags;
3062                 wq_attr.flags_mask = cmd.flags_mask;
3063         }
3064         ret = wq->device->modify_wq(wq, &wq_attr, cmd.attr_mask,
3065                                     &attrs->driver_udata);
3066         uobj_put_obj_read(wq);
3067         return ret;
3068 }
3069
3070 static int ib_uverbs_ex_create_rwq_ind_table(struct uverbs_attr_bundle *attrs)
3071 {
3072         struct ib_uverbs_ex_create_rwq_ind_table cmd;
3073         struct ib_uverbs_ex_create_rwq_ind_table_resp  resp = {};
3074         struct ib_uobject                 *uobj;
3075         int err;
3076         struct ib_rwq_ind_table_init_attr init_attr = {};
3077         struct ib_rwq_ind_table *rwq_ind_tbl;
3078         struct ib_wq    **wqs = NULL;
3079         u32 *wqs_handles = NULL;
3080         struct ib_wq    *wq = NULL;
3081         int i, j, num_read_wqs;
3082         u32 num_wq_handles;
3083         struct uverbs_req_iter iter;
3084         struct ib_device *ib_dev;
3085
3086         err = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd));
3087         if (err)
3088                 return err;
3089
3090         if (cmd.comp_mask)
3091                 return -EOPNOTSUPP;
3092
3093         if (cmd.log_ind_tbl_size > IB_USER_VERBS_MAX_LOG_IND_TBL_SIZE)
3094                 return -EINVAL;
3095
3096         num_wq_handles = 1 << cmd.log_ind_tbl_size;
3097         wqs_handles = kcalloc(num_wq_handles, sizeof(*wqs_handles),
3098                               GFP_KERNEL);
3099         if (!wqs_handles)
3100                 return -ENOMEM;
3101
3102         err = uverbs_request_next(&iter, wqs_handles,
3103                                   num_wq_handles * sizeof(__u32));
3104         if (err)
3105                 goto err_free;
3106
3107         err = uverbs_request_finish(&iter);
3108         if (err)
3109                 goto err_free;
3110
3111         wqs = kcalloc(num_wq_handles, sizeof(*wqs), GFP_KERNEL);
3112         if (!wqs) {
3113                 err = -ENOMEM;
3114                 goto  err_free;
3115         }
3116
3117         for (num_read_wqs = 0; num_read_wqs < num_wq_handles;
3118                         num_read_wqs++) {
3119                 wq = uobj_get_obj_read(wq, UVERBS_OBJECT_WQ,
3120                                        wqs_handles[num_read_wqs], attrs);
3121                 if (!wq) {
3122                         err = -EINVAL;
3123                         goto put_wqs;
3124                 }
3125
3126                 wqs[num_read_wqs] = wq;
3127         }
3128
3129         uobj = uobj_alloc(UVERBS_OBJECT_RWQ_IND_TBL, attrs, &ib_dev);
3130         if (IS_ERR(uobj)) {
3131                 err = PTR_ERR(uobj);
3132                 goto put_wqs;
3133         }
3134
3135         init_attr.log_ind_tbl_size = cmd.log_ind_tbl_size;
3136         init_attr.ind_tbl = wqs;
3137
3138         rwq_ind_tbl = ib_dev->create_rwq_ind_table(ib_dev, &init_attr,
3139                                                    &attrs->driver_udata);
3140
3141         if (IS_ERR(rwq_ind_tbl)) {
3142                 err = PTR_ERR(rwq_ind_tbl);
3143                 goto err_uobj;
3144         }
3145
3146         rwq_ind_tbl->ind_tbl = wqs;
3147         rwq_ind_tbl->log_ind_tbl_size = init_attr.log_ind_tbl_size;
3148         rwq_ind_tbl->uobject = uobj;
3149         uobj->object = rwq_ind_tbl;
3150         rwq_ind_tbl->device = ib_dev;
3151         atomic_set(&rwq_ind_tbl->usecnt, 0);
3152
3153         for (i = 0; i < num_wq_handles; i++)
3154                 atomic_inc(&wqs[i]->usecnt);
3155
3156         resp.ind_tbl_handle = uobj->id;
3157         resp.ind_tbl_num = rwq_ind_tbl->ind_tbl_num;
3158         resp.response_length = uverbs_response_length(attrs, sizeof(resp));
3159
3160         err = uverbs_response(attrs, &resp, sizeof(resp));
3161         if (err)
3162                 goto err_copy;
3163
3164         kfree(wqs_handles);
3165
3166         for (j = 0; j < num_read_wqs; j++)
3167                 uobj_put_obj_read(wqs[j]);
3168
3169         return uobj_alloc_commit(uobj);
3170
3171 err_copy:
3172         ib_destroy_rwq_ind_table(rwq_ind_tbl);
3173 err_uobj:
3174         uobj_alloc_abort(uobj);
3175 put_wqs:
3176         for (j = 0; j < num_read_wqs; j++)
3177                 uobj_put_obj_read(wqs[j]);
3178 err_free:
3179         kfree(wqs_handles);
3180         kfree(wqs);
3181         return err;
3182 }
3183
3184 static int ib_uverbs_ex_destroy_rwq_ind_table(struct uverbs_attr_bundle *attrs)
3185 {
3186         struct ib_uverbs_ex_destroy_rwq_ind_table cmd;
3187         int ret;
3188
3189         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3190         if (ret)
3191                 return ret;
3192
3193         if (cmd.comp_mask)
3194                 return -EOPNOTSUPP;
3195
3196         return uobj_perform_destroy(UVERBS_OBJECT_RWQ_IND_TBL,
3197                                     cmd.ind_tbl_handle, attrs);
3198 }
3199
3200 static int ib_uverbs_ex_create_flow(struct uverbs_attr_bundle *attrs)
3201 {
3202         struct ib_uverbs_create_flow      cmd;
3203         struct ib_uverbs_create_flow_resp resp;
3204         struct ib_uobject                 *uobj;
3205         struct ib_flow                    *flow_id;
3206         struct ib_uverbs_flow_attr        *kern_flow_attr;
3207         struct ib_flow_attr               *flow_attr;
3208         struct ib_qp                      *qp;
3209         struct ib_uflow_resources         *uflow_res;
3210         struct ib_uverbs_flow_spec_hdr    *kern_spec;
3211         struct uverbs_req_iter iter;
3212         int err;
3213         void *ib_spec;
3214         int i;
3215         struct ib_device *ib_dev;
3216
3217         err = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd));
3218         if (err)
3219                 return err;
3220
3221         if (cmd.comp_mask)
3222                 return -EINVAL;
3223
3224         if (!capable(CAP_NET_RAW))
3225                 return -EPERM;
3226
3227         if (cmd.flow_attr.flags >= IB_FLOW_ATTR_FLAGS_RESERVED)
3228                 return -EINVAL;
3229
3230         if ((cmd.flow_attr.flags & IB_FLOW_ATTR_FLAGS_DONT_TRAP) &&
3231             ((cmd.flow_attr.type == IB_FLOW_ATTR_ALL_DEFAULT) ||
3232              (cmd.flow_attr.type == IB_FLOW_ATTR_MC_DEFAULT)))
3233                 return -EINVAL;
3234
3235         if (cmd.flow_attr.num_of_specs > IB_FLOW_SPEC_SUPPORT_LAYERS)
3236                 return -EINVAL;
3237
3238         if (cmd.flow_attr.size >
3239             (cmd.flow_attr.num_of_specs * sizeof(struct ib_uverbs_flow_spec)))
3240                 return -EINVAL;
3241
3242         if (cmd.flow_attr.reserved[0] ||
3243             cmd.flow_attr.reserved[1])
3244                 return -EINVAL;
3245
3246         if (cmd.flow_attr.num_of_specs) {
3247                 kern_flow_attr = kmalloc(sizeof(*kern_flow_attr) + cmd.flow_attr.size,
3248                                          GFP_KERNEL);
3249                 if (!kern_flow_attr)
3250                         return -ENOMEM;
3251
3252                 *kern_flow_attr = cmd.flow_attr;
3253                 err = uverbs_request_next(&iter, &kern_flow_attr->flow_specs,
3254                                           cmd.flow_attr.size);
3255                 if (err)
3256                         goto err_free_attr;
3257         } else {
3258                 kern_flow_attr = &cmd.flow_attr;
3259         }
3260
3261         err = uverbs_request_finish(&iter);
3262         if (err)
3263                 goto err_free_attr;
3264
3265         uobj = uobj_alloc(UVERBS_OBJECT_FLOW, attrs, &ib_dev);
3266         if (IS_ERR(uobj)) {
3267                 err = PTR_ERR(uobj);
3268                 goto err_free_attr;
3269         }
3270
3271         qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
3272         if (!qp) {
3273                 err = -EINVAL;
3274                 goto err_uobj;
3275         }
3276
3277         if (qp->qp_type != IB_QPT_UD && qp->qp_type != IB_QPT_RAW_PACKET) {
3278                 err = -EINVAL;
3279                 goto err_put;
3280         }
3281
3282         flow_attr = kzalloc(struct_size(flow_attr, flows,
3283                                 cmd.flow_attr.num_of_specs), GFP_KERNEL);
3284         if (!flow_attr) {
3285                 err = -ENOMEM;
3286                 goto err_put;
3287         }
3288         uflow_res = flow_resources_alloc(cmd.flow_attr.num_of_specs);
3289         if (!uflow_res) {
3290                 err = -ENOMEM;
3291                 goto err_free_flow_attr;
3292         }
3293
3294         flow_attr->type = kern_flow_attr->type;
3295         flow_attr->priority = kern_flow_attr->priority;
3296         flow_attr->num_of_specs = kern_flow_attr->num_of_specs;
3297         flow_attr->port = kern_flow_attr->port;
3298         flow_attr->flags = kern_flow_attr->flags;
3299         flow_attr->size = sizeof(*flow_attr);
3300
3301         kern_spec = kern_flow_attr->flow_specs;
3302         ib_spec = flow_attr + 1;
3303         for (i = 0; i < flow_attr->num_of_specs &&
3304                         cmd.flow_attr.size >= sizeof(*kern_spec) &&
3305                         cmd.flow_attr.size >= kern_spec->size;
3306              i++) {
3307                 err = kern_spec_to_ib_spec(
3308                                 attrs, (struct ib_uverbs_flow_spec *)kern_spec,
3309                                 ib_spec, uflow_res);
3310                 if (err)
3311                         goto err_free;
3312
3313                 flow_attr->size +=
3314                         ((union ib_flow_spec *) ib_spec)->size;
3315                 cmd.flow_attr.size -= kern_spec->size;
3316                 kern_spec = ((void *)kern_spec) + kern_spec->size;
3317                 ib_spec += ((union ib_flow_spec *) ib_spec)->size;
3318         }
3319         if (cmd.flow_attr.size || (i != flow_attr->num_of_specs)) {
3320                 pr_warn("create flow failed, flow %d: %d bytes left from uverb cmd\n",
3321                         i, cmd.flow_attr.size);
3322                 err = -EINVAL;
3323                 goto err_free;
3324         }
3325
3326         flow_id = qp->device->create_flow(qp, flow_attr, IB_FLOW_DOMAIN_USER,
3327                                           &attrs->driver_udata);
3328
3329         if (IS_ERR(flow_id)) {
3330                 err = PTR_ERR(flow_id);
3331                 goto err_free;
3332         }
3333
3334         ib_set_flow(uobj, flow_id, qp, qp->device, uflow_res);
3335
3336         memset(&resp, 0, sizeof(resp));
3337         resp.flow_handle = uobj->id;
3338
3339         err = uverbs_response(attrs, &resp, sizeof(resp));
3340         if (err)
3341                 goto err_copy;
3342
3343         uobj_put_obj_read(qp);
3344         kfree(flow_attr);
3345         if (cmd.flow_attr.num_of_specs)
3346                 kfree(kern_flow_attr);
3347         return uobj_alloc_commit(uobj);
3348 err_copy:
3349         if (!qp->device->destroy_flow(flow_id))
3350                 atomic_dec(&qp->usecnt);
3351 err_free:
3352         ib_uverbs_flow_resources_free(uflow_res);
3353 err_free_flow_attr:
3354         kfree(flow_attr);
3355 err_put:
3356         uobj_put_obj_read(qp);
3357 err_uobj:
3358         uobj_alloc_abort(uobj);
3359 err_free_attr:
3360         if (cmd.flow_attr.num_of_specs)
3361                 kfree(kern_flow_attr);
3362         return err;
3363 }
3364
3365 static int ib_uverbs_ex_destroy_flow(struct uverbs_attr_bundle *attrs)
3366 {
3367         struct ib_uverbs_destroy_flow   cmd;
3368         int                             ret;
3369
3370         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3371         if (ret)
3372                 return ret;
3373
3374         if (cmd.comp_mask)
3375                 return -EINVAL;
3376
3377         return uobj_perform_destroy(UVERBS_OBJECT_FLOW, cmd.flow_handle, attrs);
3378 }
3379
3380 static int __uverbs_create_xsrq(struct uverbs_attr_bundle *attrs,
3381                                 struct ib_uverbs_create_xsrq *cmd,
3382                                 struct ib_udata *udata)
3383 {
3384         struct ib_uverbs_create_srq_resp resp;
3385         struct ib_usrq_object           *obj;
3386         struct ib_pd                    *pd;
3387         struct ib_srq                   *srq;
3388         struct ib_uobject               *uninitialized_var(xrcd_uobj);
3389         struct ib_srq_init_attr          attr;
3390         int ret;
3391         struct ib_device *ib_dev;
3392
3393         obj = (struct ib_usrq_object *)uobj_alloc(UVERBS_OBJECT_SRQ, attrs,
3394                                                   &ib_dev);
3395         if (IS_ERR(obj))
3396                 return PTR_ERR(obj);
3397
3398         if (cmd->srq_type == IB_SRQT_TM)
3399                 attr.ext.tag_matching.max_num_tags = cmd->max_num_tags;
3400
3401         if (cmd->srq_type == IB_SRQT_XRC) {
3402                 xrcd_uobj = uobj_get_read(UVERBS_OBJECT_XRCD, cmd->xrcd_handle,
3403                                           attrs);
3404                 if (IS_ERR(xrcd_uobj)) {
3405                         ret = -EINVAL;
3406                         goto err;
3407                 }
3408
3409                 attr.ext.xrc.xrcd = (struct ib_xrcd *)xrcd_uobj->object;
3410                 if (!attr.ext.xrc.xrcd) {
3411                         ret = -EINVAL;
3412                         goto err_put_xrcd;
3413                 }
3414
3415                 obj->uxrcd = container_of(xrcd_uobj, struct ib_uxrcd_object, uobject);
3416                 atomic_inc(&obj->uxrcd->refcnt);
3417         }
3418
3419         if (ib_srq_has_cq(cmd->srq_type)) {
3420                 attr.ext.cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ,
3421                                                 cmd->cq_handle, attrs);
3422                 if (!attr.ext.cq) {
3423                         ret = -EINVAL;
3424                         goto err_put_xrcd;
3425                 }
3426         }
3427
3428         pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd->pd_handle, attrs);
3429         if (!pd) {
3430                 ret = -EINVAL;
3431                 goto err_put_cq;
3432         }
3433
3434         attr.event_handler  = ib_uverbs_srq_event_handler;
3435         attr.srq_context    = attrs->ufile;
3436         attr.srq_type       = cmd->srq_type;
3437         attr.attr.max_wr    = cmd->max_wr;
3438         attr.attr.max_sge   = cmd->max_sge;
3439         attr.attr.srq_limit = cmd->srq_limit;
3440
3441         obj->uevent.events_reported = 0;
3442         INIT_LIST_HEAD(&obj->uevent.event_list);
3443
3444         srq = pd->device->create_srq(pd, &attr, udata);
3445         if (IS_ERR(srq)) {
3446                 ret = PTR_ERR(srq);
3447                 goto err_put;
3448         }
3449
3450         srq->device        = pd->device;
3451         srq->pd            = pd;
3452         srq->srq_type      = cmd->srq_type;
3453         srq->uobject       = &obj->uevent.uobject;
3454         srq->event_handler = attr.event_handler;
3455         srq->srq_context   = attr.srq_context;
3456
3457         if (ib_srq_has_cq(cmd->srq_type)) {
3458                 srq->ext.cq       = attr.ext.cq;
3459                 atomic_inc(&attr.ext.cq->usecnt);
3460         }
3461
3462         if (cmd->srq_type == IB_SRQT_XRC) {
3463                 srq->ext.xrc.xrcd = attr.ext.xrc.xrcd;
3464                 atomic_inc(&attr.ext.xrc.xrcd->usecnt);
3465         }
3466
3467         atomic_inc(&pd->usecnt);
3468         atomic_set(&srq->usecnt, 0);
3469
3470         obj->uevent.uobject.object = srq;
3471         obj->uevent.uobject.user_handle = cmd->user_handle;
3472
3473         memset(&resp, 0, sizeof resp);
3474         resp.srq_handle = obj->uevent.uobject.id;
3475         resp.max_wr     = attr.attr.max_wr;
3476         resp.max_sge    = attr.attr.max_sge;
3477         if (cmd->srq_type == IB_SRQT_XRC)
3478                 resp.srqn = srq->ext.xrc.srq_num;
3479
3480         ret = uverbs_response(attrs, &resp, sizeof(resp));
3481         if (ret)
3482                 goto err_copy;
3483
3484         if (cmd->srq_type == IB_SRQT_XRC)
3485                 uobj_put_read(xrcd_uobj);
3486
3487         if (ib_srq_has_cq(cmd->srq_type))
3488                 uobj_put_obj_read(attr.ext.cq);
3489
3490         uobj_put_obj_read(pd);
3491         return uobj_alloc_commit(&obj->uevent.uobject);
3492
3493 err_copy:
3494         ib_destroy_srq(srq);
3495
3496 err_put:
3497         uobj_put_obj_read(pd);
3498
3499 err_put_cq:
3500         if (ib_srq_has_cq(cmd->srq_type))
3501                 uobj_put_obj_read(attr.ext.cq);
3502
3503 err_put_xrcd:
3504         if (cmd->srq_type == IB_SRQT_XRC) {
3505                 atomic_dec(&obj->uxrcd->refcnt);
3506                 uobj_put_read(xrcd_uobj);
3507         }
3508
3509 err:
3510         uobj_alloc_abort(&obj->uevent.uobject);
3511         return ret;
3512 }
3513
3514 static int ib_uverbs_create_srq(struct uverbs_attr_bundle *attrs)
3515 {
3516         struct ib_uverbs_create_srq      cmd;
3517         struct ib_uverbs_create_xsrq     xcmd;
3518         int ret;
3519
3520         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3521         if (ret)
3522                 return ret;
3523
3524         memset(&xcmd, 0, sizeof(xcmd));
3525         xcmd.response    = cmd.response;
3526         xcmd.user_handle = cmd.user_handle;
3527         xcmd.srq_type    = IB_SRQT_BASIC;
3528         xcmd.pd_handle   = cmd.pd_handle;
3529         xcmd.max_wr      = cmd.max_wr;
3530         xcmd.max_sge     = cmd.max_sge;
3531         xcmd.srq_limit   = cmd.srq_limit;
3532
3533         return __uverbs_create_xsrq(attrs, &xcmd, &attrs->driver_udata);
3534 }
3535
3536 static int ib_uverbs_create_xsrq(struct uverbs_attr_bundle *attrs)
3537 {
3538         struct ib_uverbs_create_xsrq     cmd;
3539         int ret;
3540
3541         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3542         if (ret)
3543                 return ret;
3544
3545         return __uverbs_create_xsrq(attrs, &cmd, &attrs->driver_udata);
3546 }
3547
3548 static int ib_uverbs_modify_srq(struct uverbs_attr_bundle *attrs)
3549 {
3550         struct ib_uverbs_modify_srq cmd;
3551         struct ib_srq              *srq;
3552         struct ib_srq_attr          attr;
3553         int                         ret;
3554
3555         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3556         if (ret)
3557                 return ret;
3558
3559         srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs);
3560         if (!srq)
3561                 return -EINVAL;
3562
3563         attr.max_wr    = cmd.max_wr;
3564         attr.srq_limit = cmd.srq_limit;
3565
3566         ret = srq->device->modify_srq(srq, &attr, cmd.attr_mask,
3567                                       &attrs->driver_udata);
3568
3569         uobj_put_obj_read(srq);
3570
3571         return ret;
3572 }
3573
3574 static int ib_uverbs_query_srq(struct uverbs_attr_bundle *attrs)
3575 {
3576         struct ib_uverbs_query_srq      cmd;
3577         struct ib_uverbs_query_srq_resp resp;
3578         struct ib_srq_attr              attr;
3579         struct ib_srq                   *srq;
3580         int                             ret;
3581
3582         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3583         if (ret)
3584                 return ret;
3585
3586         srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs);
3587         if (!srq)
3588                 return -EINVAL;
3589
3590         ret = ib_query_srq(srq, &attr);
3591
3592         uobj_put_obj_read(srq);
3593
3594         if (ret)
3595                 return ret;
3596
3597         memset(&resp, 0, sizeof resp);
3598
3599         resp.max_wr    = attr.max_wr;
3600         resp.max_sge   = attr.max_sge;
3601         resp.srq_limit = attr.srq_limit;
3602
3603         return uverbs_response(attrs, &resp, sizeof(resp));
3604 }
3605
3606 static int ib_uverbs_destroy_srq(struct uverbs_attr_bundle *attrs)
3607 {
3608         struct ib_uverbs_destroy_srq      cmd;
3609         struct ib_uverbs_destroy_srq_resp resp;
3610         struct ib_uobject                *uobj;
3611         struct ib_uevent_object          *obj;
3612         int ret;
3613
3614         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3615         if (ret)
3616                 return ret;
3617
3618         uobj = uobj_get_destroy(UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs);
3619         if (IS_ERR(uobj))
3620                 return PTR_ERR(uobj);
3621
3622         obj = container_of(uobj, struct ib_uevent_object, uobject);
3623         memset(&resp, 0, sizeof(resp));
3624         resp.events_reported = obj->events_reported;
3625
3626         uobj_put_destroy(uobj);
3627
3628         return uverbs_response(attrs, &resp, sizeof(resp));
3629 }
3630
3631 static int ib_uverbs_ex_query_device(struct uverbs_attr_bundle *attrs)
3632 {
3633         struct ib_uverbs_ex_query_device_resp resp = {};
3634         struct ib_uverbs_ex_query_device  cmd;
3635         struct ib_device_attr attr = {0};
3636         struct ib_ucontext *ucontext;
3637         struct ib_device *ib_dev;
3638         int err;
3639
3640         ucontext = ib_uverbs_get_ucontext(attrs);
3641         if (IS_ERR(ucontext))
3642                 return PTR_ERR(ucontext);
3643         ib_dev = ucontext->device;
3644
3645         err = uverbs_request(attrs, &cmd, sizeof(cmd));
3646         if (err)
3647                 return err;
3648
3649         if (cmd.comp_mask)
3650                 return -EINVAL;
3651
3652         if (cmd.reserved)
3653                 return -EINVAL;
3654
3655         err = ib_dev->query_device(ib_dev, &attr, &attrs->driver_udata);
3656         if (err)
3657                 return err;
3658
3659         copy_query_dev_fields(ucontext, &resp.base, &attr);
3660
3661 #ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
3662         resp.odp_caps.general_caps = attr.odp_caps.general_caps;
3663         resp.odp_caps.per_transport_caps.rc_odp_caps =
3664                 attr.odp_caps.per_transport_caps.rc_odp_caps;
3665         resp.odp_caps.per_transport_caps.uc_odp_caps =
3666                 attr.odp_caps.per_transport_caps.uc_odp_caps;
3667         resp.odp_caps.per_transport_caps.ud_odp_caps =
3668                 attr.odp_caps.per_transport_caps.ud_odp_caps;
3669 #endif
3670
3671         resp.timestamp_mask = attr.timestamp_mask;
3672         resp.hca_core_clock = attr.hca_core_clock;
3673         resp.device_cap_flags_ex = attr.device_cap_flags;
3674         resp.rss_caps.supported_qpts = attr.rss_caps.supported_qpts;
3675         resp.rss_caps.max_rwq_indirection_tables =
3676                 attr.rss_caps.max_rwq_indirection_tables;
3677         resp.rss_caps.max_rwq_indirection_table_size =
3678                 attr.rss_caps.max_rwq_indirection_table_size;
3679         resp.max_wq_type_rq = attr.max_wq_type_rq;
3680         resp.raw_packet_caps = attr.raw_packet_caps;
3681         resp.tm_caps.max_rndv_hdr_size  = attr.tm_caps.max_rndv_hdr_size;
3682         resp.tm_caps.max_num_tags       = attr.tm_caps.max_num_tags;
3683         resp.tm_caps.max_ops            = attr.tm_caps.max_ops;
3684         resp.tm_caps.max_sge            = attr.tm_caps.max_sge;
3685         resp.tm_caps.flags              = attr.tm_caps.flags;
3686         resp.cq_moderation_caps.max_cq_moderation_count  =
3687                 attr.cq_caps.max_cq_moderation_count;
3688         resp.cq_moderation_caps.max_cq_moderation_period =
3689                 attr.cq_caps.max_cq_moderation_period;
3690         resp.max_dm_size = attr.max_dm_size;
3691         resp.response_length = uverbs_response_length(attrs, sizeof(resp));
3692
3693         return uverbs_response(attrs, &resp, sizeof(resp));
3694 }
3695
3696 static int ib_uverbs_ex_modify_cq(struct uverbs_attr_bundle *attrs)
3697 {
3698         struct ib_uverbs_ex_modify_cq cmd;
3699         struct ib_cq *cq;
3700         int ret;
3701
3702         ret = uverbs_request(attrs, &cmd, sizeof(cmd));
3703         if (ret)
3704                 return ret;
3705
3706         if (!cmd.attr_mask || cmd.reserved)
3707                 return -EINVAL;
3708
3709         if (cmd.attr_mask > IB_CQ_MODERATE)
3710                 return -EOPNOTSUPP;
3711
3712         cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs);
3713         if (!cq)
3714                 return -EINVAL;
3715
3716         ret = rdma_set_cq_moderation(cq, cmd.attr.cq_count, cmd.attr.cq_period);
3717
3718         uobj_put_obj_read(cq);
3719
3720         return ret;
3721 }
3722
3723 /*
3724  * Describe the input structs for write(). Some write methods have an input
3725  * only struct, most have an input and output. If the struct has an output then
3726  * the 'response' u64 must be the first field in the request structure.
3727  *
3728  * If udata is present then both the request and response structs have a
3729  * trailing driver_data flex array. In this case the size of the base struct
3730  * cannot be changed.
3731  */
3732 #define offsetof_after(_struct, _member)                                       \
3733         (offsetof(_struct, _member) + sizeof(((_struct *)NULL)->_member))
3734
3735 #define UAPI_DEF_WRITE_IO(req, resp)                                           \
3736         .write.has_resp = 1 +                                                  \
3737                           BUILD_BUG_ON_ZERO(offsetof(req, response) != 0) +    \
3738                           BUILD_BUG_ON_ZERO(sizeof(((req *)0)->response) !=    \
3739                                             sizeof(u64)),                      \
3740         .write.req_size = sizeof(req), .write.resp_size = sizeof(resp)
3741
3742 #define UAPI_DEF_WRITE_I(req) .write.req_size = sizeof(req)
3743
3744 #define UAPI_DEF_WRITE_UDATA_IO(req, resp)                                     \
3745         UAPI_DEF_WRITE_IO(req, resp),                                          \
3746                 .write.has_udata =                                             \
3747                         1 +                                                    \
3748                         BUILD_BUG_ON_ZERO(offsetof(req, driver_data) !=        \
3749                                           sizeof(req)) +                       \
3750                         BUILD_BUG_ON_ZERO(offsetof(resp, driver_data) !=       \
3751                                           sizeof(resp))
3752
3753 #define UAPI_DEF_WRITE_UDATA_I(req)                                            \
3754         UAPI_DEF_WRITE_I(req),                                                 \
3755                 .write.has_udata =                                             \
3756                         1 + BUILD_BUG_ON_ZERO(offsetof(req, driver_data) !=    \
3757                                               sizeof(req))
3758
3759 /*
3760  * The _EX versions are for use with WRITE_EX and allow the last struct member
3761  * to be specified. Buffers that do not include that member will be rejected.
3762  */
3763 #define UAPI_DEF_WRITE_IO_EX(req, req_last_member, resp, resp_last_member)     \
3764         .write.has_resp = 1,                                                   \
3765         .write.req_size = offsetof_after(req, req_last_member),                \
3766         .write.resp_size = offsetof_after(resp, resp_last_member)
3767
3768 #define UAPI_DEF_WRITE_I_EX(req, req_last_member)                              \
3769         .write.req_size = offsetof_after(req, req_last_member)
3770
3771 const struct uapi_definition uverbs_def_write_intf[] = {
3772         DECLARE_UVERBS_OBJECT(
3773                 UVERBS_OBJECT_AH,
3774                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_AH,
3775                                      ib_uverbs_create_ah,
3776                                      UAPI_DEF_WRITE_UDATA_IO(
3777                                              struct ib_uverbs_create_ah,
3778                                              struct ib_uverbs_create_ah_resp),
3779                                      UAPI_DEF_METHOD_NEEDS_FN(create_ah)),
3780                 DECLARE_UVERBS_WRITE(
3781                         IB_USER_VERBS_CMD_DESTROY_AH,
3782                         ib_uverbs_destroy_ah,
3783                         UAPI_DEF_WRITE_I(struct ib_uverbs_destroy_ah),
3784                         UAPI_DEF_METHOD_NEEDS_FN(destroy_ah))),
3785
3786         DECLARE_UVERBS_OBJECT(
3787                 UVERBS_OBJECT_COMP_CHANNEL,
3788                 DECLARE_UVERBS_WRITE(
3789                         IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL,
3790                         ib_uverbs_create_comp_channel,
3791                         UAPI_DEF_WRITE_IO(
3792                                 struct ib_uverbs_create_comp_channel,
3793                                 struct ib_uverbs_create_comp_channel_resp))),
3794
3795         DECLARE_UVERBS_OBJECT(
3796                 UVERBS_OBJECT_CQ,
3797                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_CQ,
3798                                      ib_uverbs_create_cq,
3799                                      UAPI_DEF_WRITE_UDATA_IO(
3800                                              struct ib_uverbs_create_cq,
3801                                              struct ib_uverbs_create_cq_resp),
3802                                      UAPI_DEF_METHOD_NEEDS_FN(create_cq)),
3803                 DECLARE_UVERBS_WRITE(
3804                         IB_USER_VERBS_CMD_DESTROY_CQ,
3805                         ib_uverbs_destroy_cq,
3806                         UAPI_DEF_WRITE_IO(struct ib_uverbs_destroy_cq,
3807                                           struct ib_uverbs_destroy_cq_resp),
3808                         UAPI_DEF_METHOD_NEEDS_FN(destroy_cq)),
3809                 DECLARE_UVERBS_WRITE(
3810                         IB_USER_VERBS_CMD_POLL_CQ,
3811                         ib_uverbs_poll_cq,
3812                         UAPI_DEF_WRITE_IO(struct ib_uverbs_poll_cq,
3813                                           struct ib_uverbs_poll_cq_resp),
3814                         UAPI_DEF_METHOD_NEEDS_FN(poll_cq)),
3815                 DECLARE_UVERBS_WRITE(
3816                         IB_USER_VERBS_CMD_REQ_NOTIFY_CQ,
3817                         ib_uverbs_req_notify_cq,
3818                         UAPI_DEF_WRITE_I(struct ib_uverbs_req_notify_cq),
3819                         UAPI_DEF_METHOD_NEEDS_FN(req_notify_cq)),
3820                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_RESIZE_CQ,
3821                                      ib_uverbs_resize_cq,
3822                                      UAPI_DEF_WRITE_UDATA_IO(
3823                                              struct ib_uverbs_resize_cq,
3824                                              struct ib_uverbs_resize_cq_resp),
3825                                      UAPI_DEF_METHOD_NEEDS_FN(resize_cq)),
3826                 DECLARE_UVERBS_WRITE_EX(
3827                         IB_USER_VERBS_EX_CMD_CREATE_CQ,
3828                         ib_uverbs_ex_create_cq,
3829                         UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_create_cq,
3830                                              reserved,
3831                                              struct ib_uverbs_ex_create_cq_resp,
3832                                              response_length),
3833                         UAPI_DEF_METHOD_NEEDS_FN(create_cq)),
3834                 DECLARE_UVERBS_WRITE_EX(
3835                         IB_USER_VERBS_EX_CMD_MODIFY_CQ,
3836                         ib_uverbs_ex_modify_cq,
3837                         UAPI_DEF_WRITE_I(struct ib_uverbs_ex_modify_cq),
3838                         UAPI_DEF_METHOD_NEEDS_FN(create_cq))),
3839
3840         DECLARE_UVERBS_OBJECT(
3841                 UVERBS_OBJECT_DEVICE,
3842                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_GET_CONTEXT,
3843                                      ib_uverbs_get_context,
3844                                      UAPI_DEF_WRITE_UDATA_IO(
3845                                              struct ib_uverbs_get_context,
3846                                              struct ib_uverbs_get_context_resp)),
3847                 DECLARE_UVERBS_WRITE(
3848                         IB_USER_VERBS_CMD_QUERY_DEVICE,
3849                         ib_uverbs_query_device,
3850                         UAPI_DEF_WRITE_IO(struct ib_uverbs_query_device,
3851                                           struct ib_uverbs_query_device_resp)),
3852                 DECLARE_UVERBS_WRITE(
3853                         IB_USER_VERBS_CMD_QUERY_PORT,
3854                         ib_uverbs_query_port,
3855                         UAPI_DEF_WRITE_IO(struct ib_uverbs_query_port,
3856                                           struct ib_uverbs_query_port_resp),
3857                         UAPI_DEF_METHOD_NEEDS_FN(query_port)),
3858                 DECLARE_UVERBS_WRITE_EX(
3859                         IB_USER_VERBS_EX_CMD_QUERY_DEVICE,
3860                         ib_uverbs_ex_query_device,
3861                         UAPI_DEF_WRITE_IO_EX(
3862                                 struct ib_uverbs_ex_query_device,
3863                                 reserved,
3864                                 struct ib_uverbs_ex_query_device_resp,
3865                                 response_length),
3866                         UAPI_DEF_METHOD_NEEDS_FN(query_device)),
3867                 UAPI_DEF_OBJ_NEEDS_FN(alloc_ucontext),
3868                 UAPI_DEF_OBJ_NEEDS_FN(dealloc_ucontext)),
3869
3870         DECLARE_UVERBS_OBJECT(
3871                 UVERBS_OBJECT_FLOW,
3872                 DECLARE_UVERBS_WRITE_EX(
3873                         IB_USER_VERBS_EX_CMD_CREATE_FLOW,
3874                         ib_uverbs_ex_create_flow,
3875                         UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_create_flow,
3876                                              flow_attr,
3877                                              struct ib_uverbs_create_flow_resp,
3878                                              flow_handle),
3879                         UAPI_DEF_METHOD_NEEDS_FN(create_flow)),
3880                 DECLARE_UVERBS_WRITE_EX(
3881                         IB_USER_VERBS_EX_CMD_DESTROY_FLOW,
3882                         ib_uverbs_ex_destroy_flow,
3883                         UAPI_DEF_WRITE_I(struct ib_uverbs_destroy_flow),
3884                         UAPI_DEF_METHOD_NEEDS_FN(destroy_flow))),
3885
3886         DECLARE_UVERBS_OBJECT(
3887                 UVERBS_OBJECT_MR,
3888                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_DEREG_MR,
3889                                      ib_uverbs_dereg_mr,
3890                                      UAPI_DEF_WRITE_I(struct ib_uverbs_dereg_mr),
3891                                      UAPI_DEF_METHOD_NEEDS_FN(dereg_mr)),
3892                 DECLARE_UVERBS_WRITE(
3893                         IB_USER_VERBS_CMD_REG_MR,
3894                         ib_uverbs_reg_mr,
3895                         UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_reg_mr,
3896                                                 struct ib_uverbs_reg_mr_resp),
3897                         UAPI_DEF_METHOD_NEEDS_FN(reg_user_mr)),
3898                 DECLARE_UVERBS_WRITE(
3899                         IB_USER_VERBS_CMD_REREG_MR,
3900                         ib_uverbs_rereg_mr,
3901                         UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_rereg_mr,
3902                                                 struct ib_uverbs_rereg_mr_resp),
3903                         UAPI_DEF_METHOD_NEEDS_FN(rereg_user_mr))),
3904
3905         DECLARE_UVERBS_OBJECT(
3906                 UVERBS_OBJECT_MW,
3907                 DECLARE_UVERBS_WRITE(
3908                         IB_USER_VERBS_CMD_ALLOC_MW,
3909                         ib_uverbs_alloc_mw,
3910                         UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_alloc_mw,
3911                                                 struct ib_uverbs_alloc_mw_resp),
3912                         UAPI_DEF_METHOD_NEEDS_FN(alloc_mw)),
3913                 DECLARE_UVERBS_WRITE(
3914                         IB_USER_VERBS_CMD_DEALLOC_MW,
3915                         ib_uverbs_dealloc_mw,
3916                         UAPI_DEF_WRITE_I(struct ib_uverbs_dealloc_mw),
3917                         UAPI_DEF_METHOD_NEEDS_FN(dealloc_mw))),
3918
3919         DECLARE_UVERBS_OBJECT(
3920                 UVERBS_OBJECT_PD,
3921                 DECLARE_UVERBS_WRITE(
3922                         IB_USER_VERBS_CMD_ALLOC_PD,
3923                         ib_uverbs_alloc_pd,
3924                         UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_alloc_pd,
3925                                                 struct ib_uverbs_alloc_pd_resp),
3926                         UAPI_DEF_METHOD_NEEDS_FN(alloc_pd)),
3927                 DECLARE_UVERBS_WRITE(
3928                         IB_USER_VERBS_CMD_DEALLOC_PD,
3929                         ib_uverbs_dealloc_pd,
3930                         UAPI_DEF_WRITE_I(struct ib_uverbs_dealloc_pd),
3931                         UAPI_DEF_METHOD_NEEDS_FN(dealloc_pd))),
3932
3933         DECLARE_UVERBS_OBJECT(
3934                 UVERBS_OBJECT_QP,
3935                 DECLARE_UVERBS_WRITE(
3936                         IB_USER_VERBS_CMD_ATTACH_MCAST,
3937                         ib_uverbs_attach_mcast,
3938                         UAPI_DEF_WRITE_I(struct ib_uverbs_attach_mcast),
3939                         UAPI_DEF_METHOD_NEEDS_FN(attach_mcast),
3940                         UAPI_DEF_METHOD_NEEDS_FN(detach_mcast)),
3941                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_QP,
3942                                      ib_uverbs_create_qp,
3943                                      UAPI_DEF_WRITE_UDATA_IO(
3944                                              struct ib_uverbs_create_qp,
3945                                              struct ib_uverbs_create_qp_resp),
3946                                      UAPI_DEF_METHOD_NEEDS_FN(create_qp)),
3947                 DECLARE_UVERBS_WRITE(
3948                         IB_USER_VERBS_CMD_DESTROY_QP,
3949                         ib_uverbs_destroy_qp,
3950                         UAPI_DEF_WRITE_IO(struct ib_uverbs_destroy_qp,
3951                                           struct ib_uverbs_destroy_qp_resp),
3952                         UAPI_DEF_METHOD_NEEDS_FN(destroy_qp)),
3953                 DECLARE_UVERBS_WRITE(
3954                         IB_USER_VERBS_CMD_DETACH_MCAST,
3955                         ib_uverbs_detach_mcast,
3956                         UAPI_DEF_WRITE_I(struct ib_uverbs_detach_mcast),
3957                         UAPI_DEF_METHOD_NEEDS_FN(detach_mcast)),
3958                 DECLARE_UVERBS_WRITE(
3959                         IB_USER_VERBS_CMD_MODIFY_QP,
3960                         ib_uverbs_modify_qp,
3961                         UAPI_DEF_WRITE_I(struct ib_uverbs_modify_qp),
3962                         UAPI_DEF_METHOD_NEEDS_FN(modify_qp)),
3963                 DECLARE_UVERBS_WRITE(
3964                         IB_USER_VERBS_CMD_POST_RECV,
3965                         ib_uverbs_post_recv,
3966                         UAPI_DEF_WRITE_IO(struct ib_uverbs_post_recv,
3967                                           struct ib_uverbs_post_recv_resp),
3968                         UAPI_DEF_METHOD_NEEDS_FN(post_recv)),
3969                 DECLARE_UVERBS_WRITE(
3970                         IB_USER_VERBS_CMD_POST_SEND,
3971                         ib_uverbs_post_send,
3972                         UAPI_DEF_WRITE_IO(struct ib_uverbs_post_send,
3973                                           struct ib_uverbs_post_send_resp),
3974                         UAPI_DEF_METHOD_NEEDS_FN(post_send)),
3975                 DECLARE_UVERBS_WRITE(
3976                         IB_USER_VERBS_CMD_QUERY_QP,
3977                         ib_uverbs_query_qp,
3978                         UAPI_DEF_WRITE_IO(struct ib_uverbs_query_qp,
3979                                           struct ib_uverbs_query_qp_resp),
3980                         UAPI_DEF_METHOD_NEEDS_FN(query_qp)),
3981                 DECLARE_UVERBS_WRITE_EX(
3982                         IB_USER_VERBS_EX_CMD_CREATE_QP,
3983                         ib_uverbs_ex_create_qp,
3984                         UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_create_qp,
3985                                              comp_mask,
3986                                              struct ib_uverbs_ex_create_qp_resp,
3987                                              response_length),
3988                         UAPI_DEF_METHOD_NEEDS_FN(create_qp)),
3989                 DECLARE_UVERBS_WRITE_EX(
3990                         IB_USER_VERBS_EX_CMD_MODIFY_QP,
3991                         ib_uverbs_ex_modify_qp,
3992                         UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_modify_qp,
3993                                              base,
3994                                              struct ib_uverbs_ex_modify_qp_resp,
3995                                              response_length),
3996                         UAPI_DEF_METHOD_NEEDS_FN(modify_qp))),
3997
3998         DECLARE_UVERBS_OBJECT(
3999                 UVERBS_OBJECT_RWQ_IND_TBL,
4000                 DECLARE_UVERBS_WRITE_EX(
4001                         IB_USER_VERBS_EX_CMD_CREATE_RWQ_IND_TBL,
4002                         ib_uverbs_ex_create_rwq_ind_table,
4003                         UAPI_DEF_WRITE_IO_EX(
4004                                 struct ib_uverbs_ex_create_rwq_ind_table,
4005                                 log_ind_tbl_size,
4006                                 struct ib_uverbs_ex_create_rwq_ind_table_resp,
4007                                 ind_tbl_num),
4008                         UAPI_DEF_METHOD_NEEDS_FN(create_rwq_ind_table)),
4009                 DECLARE_UVERBS_WRITE_EX(
4010                         IB_USER_VERBS_EX_CMD_DESTROY_RWQ_IND_TBL,
4011                         ib_uverbs_ex_destroy_rwq_ind_table,
4012                         UAPI_DEF_WRITE_I(
4013                                 struct ib_uverbs_ex_destroy_rwq_ind_table),
4014                         UAPI_DEF_METHOD_NEEDS_FN(destroy_rwq_ind_table))),
4015
4016         DECLARE_UVERBS_OBJECT(
4017                 UVERBS_OBJECT_WQ,
4018                 DECLARE_UVERBS_WRITE_EX(
4019                         IB_USER_VERBS_EX_CMD_CREATE_WQ,
4020                         ib_uverbs_ex_create_wq,
4021                         UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_create_wq,
4022                                              max_sge,
4023                                              struct ib_uverbs_ex_create_wq_resp,
4024                                              wqn),
4025                         UAPI_DEF_METHOD_NEEDS_FN(create_wq)),
4026                 DECLARE_UVERBS_WRITE_EX(
4027                         IB_USER_VERBS_EX_CMD_DESTROY_WQ,
4028                         ib_uverbs_ex_destroy_wq,
4029                         UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_destroy_wq,
4030                                              wq_handle,
4031                                              struct ib_uverbs_ex_destroy_wq_resp,
4032                                              reserved),
4033                         UAPI_DEF_METHOD_NEEDS_FN(destroy_wq)),
4034                 DECLARE_UVERBS_WRITE_EX(
4035                         IB_USER_VERBS_EX_CMD_MODIFY_WQ,
4036                         ib_uverbs_ex_modify_wq,
4037                         UAPI_DEF_WRITE_I_EX(struct ib_uverbs_ex_modify_wq,
4038                                             curr_wq_state),
4039                         UAPI_DEF_METHOD_NEEDS_FN(modify_wq))),
4040
4041         DECLARE_UVERBS_OBJECT(
4042                 UVERBS_OBJECT_SRQ,
4043                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_SRQ,
4044                                      ib_uverbs_create_srq,
4045                                      UAPI_DEF_WRITE_UDATA_IO(
4046                                              struct ib_uverbs_create_srq,
4047                                              struct ib_uverbs_create_srq_resp),
4048                                      UAPI_DEF_METHOD_NEEDS_FN(create_srq)),
4049                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_XSRQ,
4050                                      ib_uverbs_create_xsrq,
4051                                      UAPI_DEF_WRITE_UDATA_IO(
4052                                              struct ib_uverbs_create_xsrq,
4053                                              struct ib_uverbs_create_srq_resp),
4054                                      UAPI_DEF_METHOD_NEEDS_FN(create_srq)),
4055                 DECLARE_UVERBS_WRITE(
4056                         IB_USER_VERBS_CMD_DESTROY_SRQ,
4057                         ib_uverbs_destroy_srq,
4058                         UAPI_DEF_WRITE_IO(struct ib_uverbs_destroy_srq,
4059                                           struct ib_uverbs_destroy_srq_resp),
4060                         UAPI_DEF_METHOD_NEEDS_FN(destroy_srq)),
4061                 DECLARE_UVERBS_WRITE(
4062                         IB_USER_VERBS_CMD_MODIFY_SRQ,
4063                         ib_uverbs_modify_srq,
4064                         UAPI_DEF_WRITE_UDATA_I(struct ib_uverbs_modify_srq),
4065                         UAPI_DEF_METHOD_NEEDS_FN(modify_srq)),
4066                 DECLARE_UVERBS_WRITE(
4067                         IB_USER_VERBS_CMD_POST_SRQ_RECV,
4068                         ib_uverbs_post_srq_recv,
4069                         UAPI_DEF_WRITE_IO(struct ib_uverbs_post_srq_recv,
4070                                           struct ib_uverbs_post_srq_recv_resp),
4071                         UAPI_DEF_METHOD_NEEDS_FN(post_srq_recv)),
4072                 DECLARE_UVERBS_WRITE(
4073                         IB_USER_VERBS_CMD_QUERY_SRQ,
4074                         ib_uverbs_query_srq,
4075                         UAPI_DEF_WRITE_IO(struct ib_uverbs_query_srq,
4076                                           struct ib_uverbs_query_srq_resp),
4077                         UAPI_DEF_METHOD_NEEDS_FN(query_srq))),
4078
4079         DECLARE_UVERBS_OBJECT(
4080                 UVERBS_OBJECT_XRCD,
4081                 DECLARE_UVERBS_WRITE(
4082                         IB_USER_VERBS_CMD_CLOSE_XRCD,
4083                         ib_uverbs_close_xrcd,
4084                         UAPI_DEF_WRITE_I(struct ib_uverbs_close_xrcd),
4085                         UAPI_DEF_METHOD_NEEDS_FN(dealloc_xrcd)),
4086                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_OPEN_QP,
4087                                      ib_uverbs_open_qp,
4088                                      UAPI_DEF_WRITE_UDATA_IO(
4089                                              struct ib_uverbs_open_qp,
4090                                              struct ib_uverbs_create_qp_resp)),
4091                 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_OPEN_XRCD,
4092                                      ib_uverbs_open_xrcd,
4093                                      UAPI_DEF_WRITE_UDATA_IO(
4094                                              struct ib_uverbs_open_xrcd,
4095                                              struct ib_uverbs_open_xrcd_resp),
4096                                      UAPI_DEF_METHOD_NEEDS_FN(alloc_xrcd))),
4097
4098         {},
4099 };