IB/mthca: Make all device methods truly reentrant
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / drivers / infiniband / core / uverbs_main.c
CommitLineData
bc38a6ab
RD
1/*
2 * Copyright (c) 2005 Topspin Communications. All rights reserved.
33b9b3ee 3 * Copyright (c) 2005, 2006 Cisco Systems. All rights reserved.
2a1d9b7f
RD
4 * Copyright (c) 2005 Mellanox Technologies. All rights reserved.
5 * Copyright (c) 2005 Voltaire, Inc. All rights reserved.
67cdb40c 6 * Copyright (c) 2005 PathScale, Inc. All rights reserved.
bc38a6ab
RD
7 *
8 * This software is available to you under a choice of one of two
9 * licenses. You may choose to be licensed under the terms of the GNU
10 * General Public License (GPL) Version 2, available from the file
11 * COPYING in the main directory of this source tree, or the
12 * OpenIB.org BSD license below:
13 *
14 * Redistribution and use in source and binary forms, with or
15 * without modification, are permitted provided that the following
16 * conditions are met:
17 *
18 * - Redistributions of source code must retain the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer.
21 *
22 * - Redistributions in binary form must reproduce the above
23 * copyright notice, this list of conditions and the following
24 * disclaimer in the documentation and/or other materials
25 * provided with the distribution.
26 *
27 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
28 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
29 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
30 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
31 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
32 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
33 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34 * SOFTWARE.
35 *
36 * $Id: uverbs_main.c 2733 2005-06-28 19:14:34Z roland $
37 */
38
39#include <linux/module.h>
40#include <linux/init.h>
41#include <linux/device.h>
42#include <linux/err.h>
43#include <linux/fs.h>
44#include <linux/poll.h>
45#include <linux/file.h>
46#include <linux/mount.h>
70a30e16 47#include <linux/cdev.h>
bc38a6ab
RD
48
49#include <asm/uaccess.h>
50
51#include "uverbs.h"
52
53MODULE_AUTHOR("Roland Dreier");
54MODULE_DESCRIPTION("InfiniBand userspace verbs access");
55MODULE_LICENSE("Dual BSD/GPL");
56
57#define INFINIBANDEVENTFS_MAGIC 0x49426576 /* "IBev" */
58
59enum {
60 IB_UVERBS_MAJOR = 231,
61 IB_UVERBS_BASE_MINOR = 192,
62 IB_UVERBS_MAX_DEVICES = 32
63};
64
65#define IB_UVERBS_BASE_DEV MKDEV(IB_UVERBS_MAJOR, IB_UVERBS_BASE_MINOR)
66
70a30e16
RD
67static struct class *uverbs_class;
68
95ed644f 69DEFINE_MUTEX(ib_uverbs_idr_mutex);
bc38a6ab
RD
70DEFINE_IDR(ib_uverbs_pd_idr);
71DEFINE_IDR(ib_uverbs_mr_idr);
72DEFINE_IDR(ib_uverbs_mw_idr);
73DEFINE_IDR(ib_uverbs_ah_idr);
74DEFINE_IDR(ib_uverbs_cq_idr);
75DEFINE_IDR(ib_uverbs_qp_idr);
f520ba5a 76DEFINE_IDR(ib_uverbs_srq_idr);
bc38a6ab
RD
77
78static spinlock_t map_lock;
70a30e16 79static struct ib_uverbs_device *dev_table[IB_UVERBS_MAX_DEVICES];
bc38a6ab
RD
80static DECLARE_BITMAP(dev_map, IB_UVERBS_MAX_DEVICES);
81
82static ssize_t (*uverbs_cmd_table[])(struct ib_uverbs_file *file,
83 const char __user *buf, int in_len,
84 int out_len) = {
6b73597e
RD
85 [IB_USER_VERBS_CMD_GET_CONTEXT] = ib_uverbs_get_context,
86 [IB_USER_VERBS_CMD_QUERY_DEVICE] = ib_uverbs_query_device,
87 [IB_USER_VERBS_CMD_QUERY_PORT] = ib_uverbs_query_port,
88 [IB_USER_VERBS_CMD_ALLOC_PD] = ib_uverbs_alloc_pd,
89 [IB_USER_VERBS_CMD_DEALLOC_PD] = ib_uverbs_dealloc_pd,
90 [IB_USER_VERBS_CMD_REG_MR] = ib_uverbs_reg_mr,
91 [IB_USER_VERBS_CMD_DEREG_MR] = ib_uverbs_dereg_mr,
92 [IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL] = ib_uverbs_create_comp_channel,
93 [IB_USER_VERBS_CMD_CREATE_CQ] = ib_uverbs_create_cq,
33b9b3ee 94 [IB_USER_VERBS_CMD_RESIZE_CQ] = ib_uverbs_resize_cq,
67cdb40c
RD
95 [IB_USER_VERBS_CMD_POLL_CQ] = ib_uverbs_poll_cq,
96 [IB_USER_VERBS_CMD_REQ_NOTIFY_CQ] = ib_uverbs_req_notify_cq,
6b73597e
RD
97 [IB_USER_VERBS_CMD_DESTROY_CQ] = ib_uverbs_destroy_cq,
98 [IB_USER_VERBS_CMD_CREATE_QP] = ib_uverbs_create_qp,
7ccc9a24 99 [IB_USER_VERBS_CMD_QUERY_QP] = ib_uverbs_query_qp,
6b73597e
RD
100 [IB_USER_VERBS_CMD_MODIFY_QP] = ib_uverbs_modify_qp,
101 [IB_USER_VERBS_CMD_DESTROY_QP] = ib_uverbs_destroy_qp,
67cdb40c
RD
102 [IB_USER_VERBS_CMD_POST_SEND] = ib_uverbs_post_send,
103 [IB_USER_VERBS_CMD_POST_RECV] = ib_uverbs_post_recv,
104 [IB_USER_VERBS_CMD_POST_SRQ_RECV] = ib_uverbs_post_srq_recv,
105 [IB_USER_VERBS_CMD_CREATE_AH] = ib_uverbs_create_ah,
106 [IB_USER_VERBS_CMD_DESTROY_AH] = ib_uverbs_destroy_ah,
6b73597e
RD
107 [IB_USER_VERBS_CMD_ATTACH_MCAST] = ib_uverbs_attach_mcast,
108 [IB_USER_VERBS_CMD_DETACH_MCAST] = ib_uverbs_detach_mcast,
109 [IB_USER_VERBS_CMD_CREATE_SRQ] = ib_uverbs_create_srq,
110 [IB_USER_VERBS_CMD_MODIFY_SRQ] = ib_uverbs_modify_srq,
8bdb0e86 111 [IB_USER_VERBS_CMD_QUERY_SRQ] = ib_uverbs_query_srq,
6b73597e 112 [IB_USER_VERBS_CMD_DESTROY_SRQ] = ib_uverbs_destroy_srq,
bc38a6ab
RD
113};
114
/* Kernel-internal mount of the event pseudo-filesystem, set up at init. */
static struct vfsmount *uverbs_event_mnt;

/* IB client callbacks; referenced by uverbs_client before their definitions. */
static void ib_uverbs_add_one(struct ib_device *device);
static void ib_uverbs_remove_one(struct ib_device *device);
119
70a30e16
RD
120static void ib_uverbs_release_dev(struct kref *ref)
121{
122 struct ib_uverbs_device *dev =
123 container_of(ref, struct ib_uverbs_device, ref);
124
125 kfree(dev);
126}
127
128void ib_uverbs_release_ucq(struct ib_uverbs_file *file,
129 struct ib_uverbs_event_file *ev_file,
130 struct ib_ucq_object *uobj)
131{
132 struct ib_uverbs_event *evt, *tmp;
133
134 if (ev_file) {
135 spin_lock_irq(&ev_file->lock);
136 list_for_each_entry_safe(evt, tmp, &uobj->comp_list, obj_list) {
137 list_del(&evt->list);
138 kfree(evt);
139 }
140 spin_unlock_irq(&ev_file->lock);
141
142 kref_put(&ev_file->ref, ib_uverbs_release_event_file);
143 }
144
145 spin_lock_irq(&file->async_file->lock);
146 list_for_each_entry_safe(evt, tmp, &uobj->async_list, obj_list) {
147 list_del(&evt->list);
148 kfree(evt);
149 }
150 spin_unlock_irq(&file->async_file->lock);
151}
152
153void ib_uverbs_release_uevent(struct ib_uverbs_file *file,
154 struct ib_uevent_object *uobj)
155{
156 struct ib_uverbs_event *evt, *tmp;
157
158 spin_lock_irq(&file->async_file->lock);
159 list_for_each_entry_safe(evt, tmp, &uobj->event_list, obj_list) {
160 list_del(&evt->list);
161 kfree(evt);
162 }
163 spin_unlock_irq(&file->async_file->lock);
164}
165
f4e40156
JM
166static void ib_uverbs_detach_umcast(struct ib_qp *qp,
167 struct ib_uqp_object *uobj)
168{
169 struct ib_uverbs_mcast_entry *mcast, *tmp;
170
171 list_for_each_entry_safe(mcast, tmp, &uobj->mcast_list, list) {
172 ib_detach_mcast(qp, &mcast->gid, mcast->lid);
173 list_del(&mcast->list);
174 kfree(mcast);
175 }
176}
177
70a30e16
RD
178static int ib_uverbs_cleanup_ucontext(struct ib_uverbs_file *file,
179 struct ib_ucontext *context)
bc38a6ab
RD
180{
181 struct ib_uobject *uobj, *tmp;
182
183 if (!context)
184 return 0;
185
95ed644f 186 mutex_lock(&ib_uverbs_idr_mutex);
bc38a6ab 187
67cdb40c
RD
188 list_for_each_entry_safe(uobj, tmp, &context->ah_list, list) {
189 struct ib_ah *ah = idr_find(&ib_uverbs_ah_idr, uobj->id);
190 idr_remove(&ib_uverbs_ah_idr, uobj->id);
191 ib_destroy_ah(ah);
192 list_del(&uobj->list);
193 kfree(uobj);
194 }
bc38a6ab
RD
195
196 list_for_each_entry_safe(uobj, tmp, &context->qp_list, list) {
197 struct ib_qp *qp = idr_find(&ib_uverbs_qp_idr, uobj->id);
f4e40156
JM
198 struct ib_uqp_object *uqp =
199 container_of(uobj, struct ib_uqp_object, uevent.uobject);
bc38a6ab 200 idr_remove(&ib_uverbs_qp_idr, uobj->id);
f4e40156 201 ib_uverbs_detach_umcast(qp, uqp);
bc38a6ab
RD
202 ib_destroy_qp(qp);
203 list_del(&uobj->list);
f4e40156
JM
204 ib_uverbs_release_uevent(file, &uqp->uevent);
205 kfree(uqp);
bc38a6ab
RD
206 }
207
208 list_for_each_entry_safe(uobj, tmp, &context->cq_list, list) {
209 struct ib_cq *cq = idr_find(&ib_uverbs_cq_idr, uobj->id);
70a30e16
RD
210 struct ib_uverbs_event_file *ev_file = cq->cq_context;
211 struct ib_ucq_object *ucq =
212 container_of(uobj, struct ib_ucq_object, uobject);
bc38a6ab
RD
213 idr_remove(&ib_uverbs_cq_idr, uobj->id);
214 ib_destroy_cq(cq);
215 list_del(&uobj->list);
70a30e16
RD
216 ib_uverbs_release_ucq(file, ev_file, ucq);
217 kfree(ucq);
bc38a6ab
RD
218 }
219
f520ba5a
RD
220 list_for_each_entry_safe(uobj, tmp, &context->srq_list, list) {
221 struct ib_srq *srq = idr_find(&ib_uverbs_srq_idr, uobj->id);
70a30e16
RD
222 struct ib_uevent_object *uevent =
223 container_of(uobj, struct ib_uevent_object, uobject);
f520ba5a
RD
224 idr_remove(&ib_uverbs_srq_idr, uobj->id);
225 ib_destroy_srq(srq);
226 list_del(&uobj->list);
70a30e16
RD
227 ib_uverbs_release_uevent(file, uevent);
228 kfree(uevent);
f520ba5a
RD
229 }
230
bc38a6ab
RD
231 /* XXX Free MWs */
232
233 list_for_each_entry_safe(uobj, tmp, &context->mr_list, list) {
234 struct ib_mr *mr = idr_find(&ib_uverbs_mr_idr, uobj->id);
e1bcfcaa 235 struct ib_device *mrdev = mr->device;
bc38a6ab
RD
236 struct ib_umem_object *memobj;
237
238 idr_remove(&ib_uverbs_mr_idr, uobj->id);
239 ib_dereg_mr(mr);
240
241 memobj = container_of(uobj, struct ib_umem_object, uobject);
e1bcfcaa 242 ib_umem_release_on_close(mrdev, &memobj->umem);
bc38a6ab
RD
243
244 list_del(&uobj->list);
245 kfree(memobj);
246 }
247
248 list_for_each_entry_safe(uobj, tmp, &context->pd_list, list) {
249 struct ib_pd *pd = idr_find(&ib_uverbs_pd_idr, uobj->id);
250 idr_remove(&ib_uverbs_pd_idr, uobj->id);
251 ib_dealloc_pd(pd);
252 list_del(&uobj->list);
253 kfree(uobj);
254 }
255
95ed644f 256 mutex_unlock(&ib_uverbs_idr_mutex);
bc38a6ab
RD
257
258 return context->device->dealloc_ucontext(context);
259}
260
261static void ib_uverbs_release_file(struct kref *ref)
262{
263 struct ib_uverbs_file *file =
264 container_of(ref, struct ib_uverbs_file, ref);
265
266 module_put(file->device->ib_dev->owner);
70a30e16
RD
267 kref_put(&file->device->ref, ib_uverbs_release_dev);
268
bc38a6ab
RD
269 kfree(file);
270}
271
272static ssize_t ib_uverbs_event_read(struct file *filp, char __user *buf,
273 size_t count, loff_t *pos)
274{
275 struct ib_uverbs_event_file *file = filp->private_data;
63aaf647 276 struct ib_uverbs_event *event;
bc38a6ab
RD
277 int eventsz;
278 int ret = 0;
279
280 spin_lock_irq(&file->lock);
281
6b73597e 282 while (list_empty(&file->event_list)) {
bc38a6ab
RD
283 spin_unlock_irq(&file->lock);
284
285 if (filp->f_flags & O_NONBLOCK)
286 return -EAGAIN;
287
288 if (wait_event_interruptible(file->poll_wait,
6b73597e 289 !list_empty(&file->event_list)))
bc38a6ab
RD
290 return -ERESTARTSYS;
291
292 spin_lock_irq(&file->lock);
293 }
294
63aaf647
RD
295 event = list_entry(file->event_list.next, struct ib_uverbs_event, list);
296
297 if (file->is_async)
bc38a6ab 298 eventsz = sizeof (struct ib_uverbs_async_event_desc);
63aaf647 299 else
bc38a6ab 300 eventsz = sizeof (struct ib_uverbs_comp_event_desc);
bc38a6ab
RD
301
302 if (eventsz > count) {
303 ret = -EINVAL;
304 event = NULL;
63aaf647 305 } else {
bc38a6ab 306 list_del(file->event_list.next);
63aaf647
RD
307 if (event->counter) {
308 ++(*event->counter);
309 list_del(&event->obj_list);
310 }
311 }
bc38a6ab
RD
312
313 spin_unlock_irq(&file->lock);
314
315 if (event) {
316 if (copy_to_user(buf, event, eventsz))
317 ret = -EFAULT;
318 else
319 ret = eventsz;
320 }
321
322 kfree(event);
323
324 return ret;
325}
326
327static unsigned int ib_uverbs_event_poll(struct file *filp,
328 struct poll_table_struct *wait)
329{
330 unsigned int pollflags = 0;
331 struct ib_uverbs_event_file *file = filp->private_data;
332
333 poll_wait(filp, &file->poll_wait, wait);
334
335 spin_lock_irq(&file->lock);
6b73597e 336 if (!list_empty(&file->event_list))
bc38a6ab
RD
337 pollflags = POLLIN | POLLRDNORM;
338 spin_unlock_irq(&file->lock);
339
340 return pollflags;
341}
342
6b73597e 343void ib_uverbs_release_event_file(struct kref *ref)
bc38a6ab 344{
6b73597e
RD
345 struct ib_uverbs_event_file *file =
346 container_of(ref, struct ib_uverbs_event_file, ref);
bc38a6ab 347
6b73597e 348 kfree(file);
bc38a6ab
RD
349}
350
abdf119b
GN
351static int ib_uverbs_event_fasync(int fd, struct file *filp, int on)
352{
353 struct ib_uverbs_event_file *file = filp->private_data;
354
355 return fasync_helper(fd, filp, on, &file->async_queue);
356}
357
bc38a6ab
RD
358static int ib_uverbs_event_close(struct inode *inode, struct file *filp)
359{
360 struct ib_uverbs_event_file *file = filp->private_data;
6b73597e
RD
361 struct ib_uverbs_event *entry, *tmp;
362
363 spin_lock_irq(&file->lock);
364 file->file = NULL;
365 list_for_each_entry_safe(entry, tmp, &file->event_list, list) {
366 if (entry->counter)
367 list_del(&entry->obj_list);
368 kfree(entry);
369 }
370 spin_unlock_irq(&file->lock);
bc38a6ab 371
abdf119b 372 ib_uverbs_event_fasync(-1, filp, 0);
6b73597e
RD
373
374 if (file->is_async) {
375 ib_unregister_event_handler(&file->uverbs_file->event_handler);
376 kref_put(&file->uverbs_file->ref, ib_uverbs_release_file);
377 }
378 kref_put(&file->ref, ib_uverbs_release_event_file);
bc38a6ab
RD
379
380 return 0;
381}
382
383static struct file_operations uverbs_event_fops = {
6b73597e 384 .owner = THIS_MODULE,
bc38a6ab
RD
385 .read = ib_uverbs_event_read,
386 .poll = ib_uverbs_event_poll,
abdf119b
GN
387 .release = ib_uverbs_event_close,
388 .fasync = ib_uverbs_event_fasync
bc38a6ab
RD
389};
390
391void ib_uverbs_comp_handler(struct ib_cq *cq, void *cq_context)
392{
6b73597e
RD
393 struct ib_uverbs_event_file *file = cq_context;
394 struct ib_ucq_object *uobj;
395 struct ib_uverbs_event *entry;
396 unsigned long flags;
397
398 if (!file)
399 return;
400
401 spin_lock_irqsave(&file->lock, flags);
402 if (!file->file) {
403 spin_unlock_irqrestore(&file->lock, flags);
404 return;
405 }
bc38a6ab
RD
406
407 entry = kmalloc(sizeof *entry, GFP_ATOMIC);
305a7e87
RD
408 if (!entry) {
409 spin_unlock_irqrestore(&file->lock, flags);
bc38a6ab 410 return;
305a7e87 411 }
bc38a6ab 412
63aaf647
RD
413 uobj = container_of(cq->uobject, struct ib_ucq_object, uobject);
414
415 entry->desc.comp.cq_handle = cq->uobject->user_handle;
416 entry->counter = &uobj->comp_events_reported;
bc38a6ab 417
6b73597e 418 list_add_tail(&entry->list, &file->event_list);
63aaf647 419 list_add_tail(&entry->obj_list, &uobj->comp_list);
6b73597e 420 spin_unlock_irqrestore(&file->lock, flags);
bc38a6ab 421
6b73597e
RD
422 wake_up_interruptible(&file->poll_wait);
423 kill_fasync(&file->async_queue, SIGIO, POLL_IN);
bc38a6ab
RD
424}
425
426static void ib_uverbs_async_handler(struct ib_uverbs_file *file,
63aaf647
RD
427 __u64 element, __u64 event,
428 struct list_head *obj_list,
429 u32 *counter)
bc38a6ab 430{
63aaf647 431 struct ib_uverbs_event *entry;
bc38a6ab
RD
432 unsigned long flags;
433
6b73597e
RD
434 spin_lock_irqsave(&file->async_file->lock, flags);
435 if (!file->async_file->file) {
436 spin_unlock_irqrestore(&file->async_file->lock, flags);
437 return;
438 }
439
bc38a6ab 440 entry = kmalloc(sizeof *entry, GFP_ATOMIC);
305a7e87
RD
441 if (!entry) {
442 spin_unlock_irqrestore(&file->async_file->lock, flags);
bc38a6ab 443 return;
305a7e87 444 }
bc38a6ab 445
63aaf647
RD
446 entry->desc.async.element = element;
447 entry->desc.async.event_type = event;
448 entry->counter = counter;
bc38a6ab 449
6b73597e 450 list_add_tail(&entry->list, &file->async_file->event_list);
63aaf647
RD
451 if (obj_list)
452 list_add_tail(&entry->obj_list, obj_list);
6b73597e 453 spin_unlock_irqrestore(&file->async_file->lock, flags);
bc38a6ab 454
6b73597e
RD
455 wake_up_interruptible(&file->async_file->poll_wait);
456 kill_fasync(&file->async_file->async_queue, SIGIO, POLL_IN);
bc38a6ab
RD
457}
458
459void ib_uverbs_cq_event_handler(struct ib_event *event, void *context_ptr)
460{
7162a3e0
RD
461 struct ib_ucq_object *uobj = container_of(event->element.cq->uobject,
462 struct ib_ucq_object, uobject);
63aaf647 463
7162a3e0 464 ib_uverbs_async_handler(uobj->uverbs_file, uobj->uobject.user_handle,
63aaf647
RD
465 event->event, &uobj->async_list,
466 &uobj->async_events_reported);
bc38a6ab
RD
467}
468
469void ib_uverbs_qp_event_handler(struct ib_event *event, void *context_ptr)
470{
63aaf647
RD
471 struct ib_uevent_object *uobj;
472
473 uobj = container_of(event->element.qp->uobject,
474 struct ib_uevent_object, uobject);
475
476 ib_uverbs_async_handler(context_ptr, uobj->uobject.user_handle,
477 event->event, &uobj->event_list,
478 &uobj->events_reported);
bc38a6ab
RD
479}
480
f520ba5a
RD
481void ib_uverbs_srq_event_handler(struct ib_event *event, void *context_ptr)
482{
63aaf647
RD
483 struct ib_uevent_object *uobj;
484
485 uobj = container_of(event->element.srq->uobject,
486 struct ib_uevent_object, uobject);
487
488 ib_uverbs_async_handler(context_ptr, uobj->uobject.user_handle,
489 event->event, &uobj->event_list,
490 &uobj->events_reported);
f520ba5a
RD
491}
492
6b73597e
RD
493void ib_uverbs_event_handler(struct ib_event_handler *handler,
494 struct ib_event *event)
bc38a6ab
RD
495{
496 struct ib_uverbs_file *file =
497 container_of(handler, struct ib_uverbs_file, event_handler);
498
63aaf647
RD
499 ib_uverbs_async_handler(file, event->element.port_num, event->event,
500 NULL, NULL);
bc38a6ab
RD
501}
502
6b73597e
RD
503struct file *ib_uverbs_alloc_event_file(struct ib_uverbs_file *uverbs_file,
504 int is_async, int *fd)
bc38a6ab 505{
6b73597e 506 struct ib_uverbs_event_file *ev_file;
bc38a6ab 507 struct file *filp;
6b73597e 508 int ret;
bc38a6ab 509
6b73597e
RD
510 ev_file = kmalloc(sizeof *ev_file, GFP_KERNEL);
511 if (!ev_file)
512 return ERR_PTR(-ENOMEM);
513
514 kref_init(&ev_file->ref);
515 spin_lock_init(&ev_file->lock);
516 INIT_LIST_HEAD(&ev_file->event_list);
517 init_waitqueue_head(&ev_file->poll_wait);
518 ev_file->uverbs_file = uverbs_file;
519 ev_file->async_queue = NULL;
520 ev_file->is_async = is_async;
521
522 *fd = get_unused_fd();
523 if (*fd < 0) {
524 ret = *fd;
525 goto err;
526 }
bc38a6ab
RD
527
528 filp = get_empty_filp();
529 if (!filp) {
6b73597e
RD
530 ret = -ENFILE;
531 goto err_fd;
bc38a6ab
RD
532 }
533
6b73597e
RD
534 ev_file->file = filp;
535
536 /*
537 * fops_get() can't fail here, because we're coming from a
538 * system call on a uverbs file, which will already have a
539 * module reference.
540 */
541 filp->f_op = fops_get(&uverbs_event_fops);
bc38a6ab
RD
542 filp->f_vfsmnt = mntget(uverbs_event_mnt);
543 filp->f_dentry = dget(uverbs_event_mnt->mnt_root);
544 filp->f_mapping = filp->f_dentry->d_inode->i_mapping;
545 filp->f_flags = O_RDONLY;
546 filp->f_mode = FMODE_READ;
6b73597e 547 filp->private_data = ev_file;
bc38a6ab 548
6b73597e 549 return filp;
bc38a6ab 550
6b73597e
RD
551err_fd:
552 put_unused_fd(*fd);
553
554err:
555 kfree(ev_file);
556 return ERR_PTR(ret);
557}
558
559/*
560 * Look up a completion event file by FD. If lookup is successful,
561 * takes a ref to the event file struct that it returns; if
562 * unsuccessful, returns NULL.
563 */
564struct ib_uverbs_event_file *ib_uverbs_lookup_comp_file(int fd)
565{
566 struct ib_uverbs_event_file *ev_file = NULL;
567 struct file *filp;
568
569 filp = fget(fd);
570 if (!filp)
571 return NULL;
572
573 if (filp->f_op != &uverbs_event_fops)
574 goto out;
575
576 ev_file = filp->private_data;
577 if (ev_file->is_async) {
578 ev_file = NULL;
579 goto out;
580 }
581
582 kref_get(&ev_file->ref);
583
584out:
585 fput(filp);
586 return ev_file;
bc38a6ab
RD
587}
588
589static ssize_t ib_uverbs_write(struct file *filp, const char __user *buf,
590 size_t count, loff_t *pos)
591{
592 struct ib_uverbs_file *file = filp->private_data;
593 struct ib_uverbs_cmd_hdr hdr;
594
595 if (count < sizeof hdr)
596 return -EINVAL;
597
598 if (copy_from_user(&hdr, buf, sizeof hdr))
599 return -EFAULT;
600
601 if (hdr.in_words * 4 != count)
602 return -EINVAL;
603
63c47c28
RD
604 if (hdr.command < 0 ||
605 hdr.command >= ARRAY_SIZE(uverbs_cmd_table) ||
883a99c7
RD
606 !uverbs_cmd_table[hdr.command] ||
607 !(file->device->ib_dev->uverbs_cmd_mask & (1ull << hdr.command)))
bc38a6ab
RD
608 return -EINVAL;
609
6b73597e 610 if (!file->ucontext &&
bc38a6ab
RD
611 hdr.command != IB_USER_VERBS_CMD_GET_CONTEXT)
612 return -EINVAL;
613
614 return uverbs_cmd_table[hdr.command](file, buf + sizeof hdr,
615 hdr.in_words * 4, hdr.out_words * 4);
616}
617
618static int ib_uverbs_mmap(struct file *filp, struct vm_area_struct *vma)
619{
620 struct ib_uverbs_file *file = filp->private_data;
621
622 if (!file->ucontext)
623 return -ENODEV;
624 else
625 return file->device->ib_dev->mmap(file->ucontext, vma);
626}
627
628static int ib_uverbs_open(struct inode *inode, struct file *filp)
629{
70a30e16 630 struct ib_uverbs_device *dev;
bc38a6ab 631 struct ib_uverbs_file *file;
70a30e16 632 int ret;
bc38a6ab 633
70a30e16
RD
634 spin_lock(&map_lock);
635 dev = dev_table[iminor(inode) - IB_UVERBS_BASE_MINOR];
636 if (dev)
637 kref_get(&dev->ref);
638 spin_unlock(&map_lock);
639
640 if (!dev)
641 return -ENXIO;
642
643 if (!try_module_get(dev->ib_dev->owner)) {
644 ret = -ENODEV;
645 goto err;
646 }
bc38a6ab 647
6b73597e 648 file = kmalloc(sizeof *file, GFP_KERNEL);
63c47c28 649 if (!file) {
70a30e16
RD
650 ret = -ENOMEM;
651 goto err_module;
63c47c28 652 }
bc38a6ab 653
70a30e16
RD
654 file->device = dev;
655 file->ucontext = NULL;
656 file->async_file = NULL;
bc38a6ab 657 kref_init(&file->ref);
95ed644f 658 mutex_init(&file->mutex);
bc38a6ab 659
bc38a6ab
RD
660 filp->private_data = file;
661
bc38a6ab 662 return 0;
70a30e16
RD
663
664err_module:
665 module_put(dev->ib_dev->owner);
666
667err:
668 kref_put(&dev->ref, ib_uverbs_release_dev);
669
670 return ret;
bc38a6ab
RD
671}
672
673static int ib_uverbs_close(struct inode *inode, struct file *filp)
674{
675 struct ib_uverbs_file *file = filp->private_data;
bc38a6ab 676
70a30e16
RD
677 ib_uverbs_cleanup_ucontext(file, file->ucontext);
678
679 if (file->async_file)
680 kref_put(&file->async_file->ref, ib_uverbs_release_event_file);
bc38a6ab 681
bc38a6ab
RD
682 kref_put(&file->ref, ib_uverbs_release_file);
683
684 return 0;
685}
686
687static struct file_operations uverbs_fops = {
688 .owner = THIS_MODULE,
689 .write = ib_uverbs_write,
690 .open = ib_uverbs_open,
691 .release = ib_uverbs_close
692};
693
694static struct file_operations uverbs_mmap_fops = {
695 .owner = THIS_MODULE,
696 .write = ib_uverbs_write,
697 .mmap = ib_uverbs_mmap,
698 .open = ib_uverbs_open,
699 .release = ib_uverbs_close
700};
701
702static struct ib_client uverbs_client = {
703 .name = "uverbs",
704 .add = ib_uverbs_add_one,
705 .remove = ib_uverbs_remove_one
706};
707
708static ssize_t show_ibdev(struct class_device *class_dev, char *buf)
709{
70a30e16
RD
710 struct ib_uverbs_device *dev = class_get_devdata(class_dev);
711
712 if (!dev)
713 return -ENODEV;
bc38a6ab
RD
714
715 return sprintf(buf, "%s\n", dev->ib_dev->name);
716}
717static CLASS_DEVICE_ATTR(ibdev, S_IRUGO, show_ibdev, NULL);
718
274c0891
RD
719static ssize_t show_dev_abi_version(struct class_device *class_dev, char *buf)
720{
70a30e16
RD
721 struct ib_uverbs_device *dev = class_get_devdata(class_dev);
722
723 if (!dev)
724 return -ENODEV;
274c0891
RD
725
726 return sprintf(buf, "%d\n", dev->ib_dev->uverbs_abi_ver);
727}
728static CLASS_DEVICE_ATTR(abi_version, S_IRUGO, show_dev_abi_version, NULL);
729
bc38a6ab
RD
730static ssize_t show_abi_version(struct class *class, char *buf)
731{
732 return sprintf(buf, "%d\n", IB_USER_VERBS_ABI_VERSION);
733}
734static CLASS_ATTR(abi_version, S_IRUGO, show_abi_version, NULL);
735
736static void ib_uverbs_add_one(struct ib_device *device)
737{
738 struct ib_uverbs_device *uverbs_dev;
739
740 if (!device->alloc_ucontext)
741 return;
742
de6eb66b 743 uverbs_dev = kzalloc(sizeof *uverbs_dev, GFP_KERNEL);
bc38a6ab
RD
744 if (!uverbs_dev)
745 return;
746
70a30e16
RD
747 kref_init(&uverbs_dev->ref);
748
bc38a6ab
RD
749 spin_lock(&map_lock);
750 uverbs_dev->devnum = find_first_zero_bit(dev_map, IB_UVERBS_MAX_DEVICES);
751 if (uverbs_dev->devnum >= IB_UVERBS_MAX_DEVICES) {
752 spin_unlock(&map_lock);
753 goto err;
754 }
755 set_bit(uverbs_dev->devnum, dev_map);
756 spin_unlock(&map_lock);
757
6b73597e
RD
758 uverbs_dev->ib_dev = device;
759 uverbs_dev->num_comp_vectors = 1;
bc38a6ab 760
70a30e16
RD
761 uverbs_dev->dev = cdev_alloc();
762 if (!uverbs_dev->dev)
bc38a6ab 763 goto err;
70a30e16
RD
764 uverbs_dev->dev->owner = THIS_MODULE;
765 uverbs_dev->dev->ops = device->mmap ? &uverbs_mmap_fops : &uverbs_fops;
766 kobject_set_name(&uverbs_dev->dev->kobj, "uverbs%d", uverbs_dev->devnum);
767 if (cdev_add(uverbs_dev->dev, IB_UVERBS_BASE_DEV + uverbs_dev->devnum, 1))
768 goto err_cdev;
bc38a6ab 769
4cce3390
RD
770 uverbs_dev->class_dev = class_device_create(uverbs_class, NULL,
771 uverbs_dev->dev->dev,
70a30e16
RD
772 device->dma_device,
773 "uverbs%d", uverbs_dev->devnum);
774 if (IS_ERR(uverbs_dev->class_dev))
bc38a6ab
RD
775 goto err_cdev;
776
70a30e16
RD
777 class_set_devdata(uverbs_dev->class_dev, uverbs_dev);
778
779 if (class_device_create_file(uverbs_dev->class_dev, &class_device_attr_ibdev))
bc38a6ab 780 goto err_class;
70a30e16 781 if (class_device_create_file(uverbs_dev->class_dev, &class_device_attr_abi_version))
274c0891 782 goto err_class;
bc38a6ab 783
70a30e16
RD
784 spin_lock(&map_lock);
785 dev_table[uverbs_dev->devnum] = uverbs_dev;
786 spin_unlock(&map_lock);
787
bc38a6ab
RD
788 ib_set_client_data(device, &uverbs_client, uverbs_dev);
789
790 return;
791
792err_class:
70a30e16 793 class_device_destroy(uverbs_class, uverbs_dev->dev->dev);
bc38a6ab
RD
794
795err_cdev:
70a30e16 796 cdev_del(uverbs_dev->dev);
bc38a6ab
RD
797 clear_bit(uverbs_dev->devnum, dev_map);
798
799err:
70a30e16 800 kref_put(&uverbs_dev->ref, ib_uverbs_release_dev);
bc38a6ab
RD
801 return;
802}
803
804static void ib_uverbs_remove_one(struct ib_device *device)
805{
806 struct ib_uverbs_device *uverbs_dev = ib_get_client_data(device, &uverbs_client);
807
808 if (!uverbs_dev)
809 return;
810
70a30e16
RD
811 class_set_devdata(uverbs_dev->class_dev, NULL);
812 class_device_destroy(uverbs_class, uverbs_dev->dev->dev);
813 cdev_del(uverbs_dev->dev);
814
815 spin_lock(&map_lock);
816 dev_table[uverbs_dev->devnum] = NULL;
817 spin_unlock(&map_lock);
818
819 clear_bit(uverbs_dev->devnum, dev_map);
820 kref_put(&uverbs_dev->ref, ib_uverbs_release_dev);
bc38a6ab
RD
821}
822
823static struct super_block *uverbs_event_get_sb(struct file_system_type *fs_type, int flags,
824 const char *dev_name, void *data)
825{
826 return get_sb_pseudo(fs_type, "infinibandevent:", NULL,
827 INFINIBANDEVENTFS_MAGIC);
828}
829
830static struct file_system_type uverbs_event_fs = {
831 /* No owner field so module can be unloaded */
832 .name = "infinibandeventfs",
833 .get_sb = uverbs_event_get_sb,
834 .kill_sb = kill_litter_super
835};
836
837static int __init ib_uverbs_init(void)
838{
839 int ret;
840
841 spin_lock_init(&map_lock);
842
843 ret = register_chrdev_region(IB_UVERBS_BASE_DEV, IB_UVERBS_MAX_DEVICES,
844 "infiniband_verbs");
845 if (ret) {
846 printk(KERN_ERR "user_verbs: couldn't register device number\n");
847 goto out;
848 }
849
70a30e16
RD
850 uverbs_class = class_create(THIS_MODULE, "infiniband_verbs");
851 if (IS_ERR(uverbs_class)) {
852 ret = PTR_ERR(uverbs_class);
bc38a6ab
RD
853 printk(KERN_ERR "user_verbs: couldn't create class infiniband_verbs\n");
854 goto out_chrdev;
855 }
856
70a30e16 857 ret = class_create_file(uverbs_class, &class_attr_abi_version);
bc38a6ab
RD
858 if (ret) {
859 printk(KERN_ERR "user_verbs: couldn't create abi_version attribute\n");
860 goto out_class;
861 }
862
863 ret = register_filesystem(&uverbs_event_fs);
864 if (ret) {
865 printk(KERN_ERR "user_verbs: couldn't register infinibandeventfs\n");
866 goto out_class;
867 }
868
869 uverbs_event_mnt = kern_mount(&uverbs_event_fs);
870 if (IS_ERR(uverbs_event_mnt)) {
871 ret = PTR_ERR(uverbs_event_mnt);
872 printk(KERN_ERR "user_verbs: couldn't mount infinibandeventfs\n");
873 goto out_fs;
874 }
875
876 ret = ib_register_client(&uverbs_client);
877 if (ret) {
878 printk(KERN_ERR "user_verbs: couldn't register client\n");
879 goto out_mnt;
880 }
881
882 return 0;
883
884out_mnt:
885 mntput(uverbs_event_mnt);
886
887out_fs:
888 unregister_filesystem(&uverbs_event_fs);
889
890out_class:
70a30e16 891 class_destroy(uverbs_class);
bc38a6ab
RD
892
893out_chrdev:
894 unregister_chrdev_region(IB_UVERBS_BASE_DEV, IB_UVERBS_MAX_DEVICES);
895
896out:
897 return ret;
898}
899
900static void __exit ib_uverbs_cleanup(void)
901{
902 ib_unregister_client(&uverbs_client);
903 mntput(uverbs_event_mnt);
904 unregister_filesystem(&uverbs_event_fs);
70a30e16 905 class_destroy(uverbs_class);
bc38a6ab 906 unregister_chrdev_region(IB_UVERBS_BASE_DEV, IB_UVERBS_MAX_DEVICES);
cc76e33e 907 flush_scheduled_work();
5d7edb3c
RD
908 idr_destroy(&ib_uverbs_pd_idr);
909 idr_destroy(&ib_uverbs_mr_idr);
910 idr_destroy(&ib_uverbs_mw_idr);
911 idr_destroy(&ib_uverbs_ah_idr);
912 idr_destroy(&ib_uverbs_cq_idr);
913 idr_destroy(&ib_uverbs_qp_idr);
914 idr_destroy(&ib_uverbs_srq_idr);
bc38a6ab
RD
915}
916
/* Module entry and exit points. */
module_init(ib_uverbs_init);
module_exit(ib_uverbs_cleanup);