RDMA/cma: Listen on specific address family
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / drivers / infiniband / core / cma.c
CommitLineData
e51060f0
SH
1/*
2 * Copyright (c) 2005 Voltaire Inc. All rights reserved.
3 * Copyright (c) 2002-2005, Network Appliance, Inc. All rights reserved.
4 * Copyright (c) 1999-2005, Mellanox Technologies, Inc. All rights reserved.
5 * Copyright (c) 2005-2006 Intel Corporation. All rights reserved.
6 *
a9474917
SH
7 * This software is available to you under a choice of one of two
8 * licenses. You may choose to be licensed under the terms of the GNU
9 * General Public License (GPL) Version 2, available from the file
10 * COPYING in the main directory of this source tree, or the
11 * OpenIB.org BSD license below:
e51060f0 12 *
a9474917
SH
13 * Redistribution and use in source and binary forms, with or
14 * without modification, are permitted provided that the following
15 * conditions are met:
e51060f0 16 *
a9474917
SH
17 * - Redistributions of source code must retain the above
18 * copyright notice, this list of conditions and the following
19 * disclaimer.
e51060f0 20 *
a9474917
SH
21 * - Redistributions in binary form must reproduce the above
22 * copyright notice, this list of conditions and the following
23 * disclaimer in the documentation and/or other materials
24 * provided with the distribution.
e51060f0 25 *
a9474917
SH
26 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
27 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
28 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
29 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
30 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
31 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
32 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
33 * SOFTWARE.
e51060f0
SH
34 */
35
36#include <linux/completion.h>
37#include <linux/in.h>
38#include <linux/in6.h>
39#include <linux/mutex.h>
40#include <linux/random.h>
41#include <linux/idr.h>
07ebafba 42#include <linux/inetdevice.h>
5a0e3ad6 43#include <linux/slab.h>
e4dd23d7 44#include <linux/module.h>
366cddb4 45#include <net/route.h>
e51060f0
SH
46
47#include <net/tcp.h>
1f5175ad 48#include <net/ipv6.h>
e51060f0
SH
49
50#include <rdma/rdma_cm.h>
51#include <rdma/rdma_cm_ib.h>
753f618a 52#include <rdma/rdma_netlink.h>
e51060f0
SH
53#include <rdma/ib_cache.h>
54#include <rdma/ib_cm.h>
55#include <rdma/ib_sa.h>
07ebafba 56#include <rdma/iw_cm.h>
e51060f0
SH
57
58MODULE_AUTHOR("Sean Hefty");
59MODULE_DESCRIPTION("Generic RDMA CM Agent");
60MODULE_LICENSE("Dual BSD/GPL");
61
/*
 * Connection-management tunables.
 * NOTE(review): units and users of these values are not visible in this
 * part of the file - confirm against the call sites before changing them.
 */
#define CMA_CM_RESPONSE_TIMEOUT		20
#define CMA_MAX_CM_RETRIES		15
#define CMA_CM_MRA_SETTING		(IB_CM_MRA_FLAG_DELAY | 24)
#define CMA_IBOE_PACKET_LIFETIME	18
e51060f0
SH
66
67static void cma_add_one(struct ib_device *device);
68static void cma_remove_one(struct ib_device *device);
69
70static struct ib_client cma_client = {
71 .name = "cma",
72 .add = cma_add_one,
73 .remove = cma_remove_one
74};
75
c1a0b23b 76static struct ib_sa_client sa_client;
7a118df3 77static struct rdma_addr_client addr_client;
e51060f0
SH
78static LIST_HEAD(dev_list);
79static LIST_HEAD(listen_any_list);
80static DEFINE_MUTEX(lock);
81static struct workqueue_struct *cma_wq;
82static DEFINE_IDR(sdp_ps);
83static DEFINE_IDR(tcp_ps);
628e5f6d 84static DEFINE_IDR(udp_ps);
c8f6a362 85static DEFINE_IDR(ipoib_ps);
2d2e9415 86static DEFINE_IDR(ib_ps);
e51060f0
SH
87
88struct cma_device {
89 struct list_head list;
90 struct ib_device *device;
e51060f0
SH
91 struct completion comp;
92 atomic_t refcount;
93 struct list_head id_list;
94};
95
e51060f0
SH
96struct rdma_bind_list {
97 struct idr *ps;
98 struct hlist_head owners;
99 unsigned short port;
100};
101
102/*
103 * Device removal can occur at any time, so we need extra handling to
104 * serialize notifying the user of device removal with other callbacks.
105 * We do this by disabling removal notification while a callback is in process,
106 * and reporting it after the callback completes.
107 */
108struct rdma_id_private {
109 struct rdma_cm_id id;
110
111 struct rdma_bind_list *bind_list;
112 struct hlist_node node;
d02d1f53
SH
113 struct list_head list; /* listen_any_list or cma_device.list */
114 struct list_head listen_list; /* per device listens */
e51060f0 115 struct cma_device *cma_dev;
c8f6a362 116 struct list_head mc_list;
e51060f0 117
d02d1f53 118 int internal_id;
550e5ca7 119 enum rdma_cm_state state;
e51060f0 120 spinlock_t lock;
c5483388
SH
121 struct mutex qp_mutex;
122
e51060f0
SH
123 struct completion comp;
124 atomic_t refcount;
de910bd9 125 struct mutex handler_mutex;
e51060f0
SH
126
127 int backlog;
128 int timeout_ms;
129 struct ib_sa_query *query;
130 int query_id;
131 union {
132 struct ib_cm_id *ib;
07ebafba 133 struct iw_cm_id *iw;
e51060f0
SH
134 } cm_id;
135
136 u32 seq_num;
c8f6a362 137 u32 qkey;
e51060f0 138 u32 qp_num;
83e9502d 139 pid_t owner;
e51060f0 140 u8 srq;
a81c994d 141 u8 tos;
a9bb7912 142 u8 reuseaddr;
5b0ec991 143 u8 afonly;
e51060f0
SH
144};
145
c8f6a362
SH
146struct cma_multicast {
147 struct rdma_id_private *id_priv;
148 union {
149 struct ib_sa_multicast *ib;
150 } multicast;
151 struct list_head list;
152 void *context;
3f446754 153 struct sockaddr_storage addr;
3c86aa70 154 struct kref mcref;
c8f6a362
SH
155};
156
e51060f0
SH
157struct cma_work {
158 struct work_struct work;
159 struct rdma_id_private *id;
550e5ca7
NM
160 enum rdma_cm_state old_state;
161 enum rdma_cm_state new_state;
e51060f0
SH
162 struct rdma_cm_event event;
163};
164
dd5bdff8
OG
165struct cma_ndev_work {
166 struct work_struct work;
167 struct rdma_id_private *id;
168 struct rdma_cm_event event;
169};
170
3c86aa70
EC
171struct iboe_mcast_work {
172 struct work_struct work;
173 struct rdma_id_private *id;
174 struct cma_multicast *mc;
175};
176
e51060f0
SH
177union cma_ip_addr {
178 struct in6_addr ip6;
179 struct {
1b90c137
AV
180 __be32 pad[3];
181 __be32 addr;
e51060f0
SH
182 } ip4;
183};
184
185struct cma_hdr {
186 u8 cma_version;
187 u8 ip_version; /* IP version: 7:4 */
1b90c137 188 __be16 port;
e51060f0
SH
189 union cma_ip_addr src_addr;
190 union cma_ip_addr dst_addr;
191};
192
193struct sdp_hh {
194 u8 bsdh[16];
195 u8 sdp_version; /* Major version: 7:4 */
196 u8 ip_version; /* IP version: 7:4 */
197 u8 sdp_specific1[10];
1b90c137
AV
198 __be16 port;
199 __be16 sdp_specific2;
e51060f0
SH
200 union cma_ip_addr src_addr;
201 union cma_ip_addr dst_addr;
202};
203
204struct sdp_hah {
205 u8 bsdh[16];
206 u8 sdp_version;
207};
208
/* Header versions accepted when parsing connection private data. */
#define CMA_VERSION		0x00
#define SDP_MAJ_VERSION		0x2
211
550e5ca7 212static int cma_comp(struct rdma_id_private *id_priv, enum rdma_cm_state comp)
e51060f0
SH
213{
214 unsigned long flags;
215 int ret;
216
217 spin_lock_irqsave(&id_priv->lock, flags);
218 ret = (id_priv->state == comp);
219 spin_unlock_irqrestore(&id_priv->lock, flags);
220 return ret;
221}
222
223static int cma_comp_exch(struct rdma_id_private *id_priv,
550e5ca7 224 enum rdma_cm_state comp, enum rdma_cm_state exch)
e51060f0
SH
225{
226 unsigned long flags;
227 int ret;
228
229 spin_lock_irqsave(&id_priv->lock, flags);
230 if ((ret = (id_priv->state == comp)))
231 id_priv->state = exch;
232 spin_unlock_irqrestore(&id_priv->lock, flags);
233 return ret;
234}
235
550e5ca7
NM
236static enum rdma_cm_state cma_exch(struct rdma_id_private *id_priv,
237 enum rdma_cm_state exch)
e51060f0
SH
238{
239 unsigned long flags;
550e5ca7 240 enum rdma_cm_state old;
e51060f0
SH
241
242 spin_lock_irqsave(&id_priv->lock, flags);
243 old = id_priv->state;
244 id_priv->state = exch;
245 spin_unlock_irqrestore(&id_priv->lock, flags);
246 return old;
247}
248
249static inline u8 cma_get_ip_ver(struct cma_hdr *hdr)
250{
251 return hdr->ip_version >> 4;
252}
253
254static inline void cma_set_ip_ver(struct cma_hdr *hdr, u8 ip_ver)
255{
256 hdr->ip_version = (ip_ver << 4) | (hdr->ip_version & 0xF);
257}
258
259static inline u8 sdp_get_majv(u8 sdp_version)
260{
261 return sdp_version >> 4;
262}
263
264static inline u8 sdp_get_ip_ver(struct sdp_hh *hh)
265{
266 return hh->ip_version >> 4;
267}
268
269static inline void sdp_set_ip_ver(struct sdp_hh *hh, u8 ip_ver)
270{
271 hh->ip_version = (ip_ver << 4) | (hh->ip_version & 0xF);
272}
273
274static void cma_attach_to_dev(struct rdma_id_private *id_priv,
275 struct cma_device *cma_dev)
276{
277 atomic_inc(&cma_dev->refcount);
278 id_priv->cma_dev = cma_dev;
279 id_priv->id.device = cma_dev->device;
3c86aa70
EC
280 id_priv->id.route.addr.dev_addr.transport =
281 rdma_node_get_transport(cma_dev->device->node_type);
e51060f0
SH
282 list_add_tail(&id_priv->list, &cma_dev->id_list);
283}
284
285static inline void cma_deref_dev(struct cma_device *cma_dev)
286{
287 if (atomic_dec_and_test(&cma_dev->refcount))
288 complete(&cma_dev->comp);
289}
290
3c86aa70
EC
291static inline void release_mc(struct kref *kref)
292{
293 struct cma_multicast *mc = container_of(kref, struct cma_multicast, mcref);
294
295 kfree(mc->multicast.ib);
296 kfree(mc);
297}
298
a396d43a 299static void cma_release_dev(struct rdma_id_private *id_priv)
e51060f0 300{
a396d43a 301 mutex_lock(&lock);
e51060f0
SH
302 list_del(&id_priv->list);
303 cma_deref_dev(id_priv->cma_dev);
304 id_priv->cma_dev = NULL;
a396d43a 305 mutex_unlock(&lock);
e51060f0
SH
306}
307
d2ca39f2 308static int cma_set_qkey(struct rdma_id_private *id_priv)
c8f6a362
SH
309{
310 struct ib_sa_mcmember_rec rec;
311 int ret = 0;
312
d2ca39f2
YE
313 if (id_priv->qkey)
314 return 0;
315
316 switch (id_priv->id.ps) {
c8f6a362 317 case RDMA_PS_UDP:
d2ca39f2 318 id_priv->qkey = RDMA_UDP_QKEY;
c8f6a362
SH
319 break;
320 case RDMA_PS_IPOIB:
d2ca39f2
YE
321 ib_addr_get_mgid(&id_priv->id.route.addr.dev_addr, &rec.mgid);
322 ret = ib_sa_get_mcmember_rec(id_priv->id.device,
323 id_priv->id.port_num, &rec.mgid,
324 &rec);
325 if (!ret)
326 id_priv->qkey = be32_to_cpu(rec.qkey);
c8f6a362
SH
327 break;
328 default:
329 break;
330 }
331 return ret;
332}
333
3c86aa70
EC
334static int find_gid_port(struct ib_device *device, union ib_gid *gid, u8 port_num)
335{
336 int i;
337 int err;
338 struct ib_port_attr props;
339 union ib_gid tmp;
340
341 err = ib_query_port(device, port_num, &props);
342 if (err)
343 return 1;
344
345 for (i = 0; i < props.gid_tbl_len; ++i) {
346 err = ib_query_gid(device, port_num, i, &tmp);
347 if (err)
348 return 1;
349 if (!memcmp(&tmp, gid, sizeof tmp))
350 return 0;
351 }
352
353 return -EAGAIN;
354}
355
07ebafba 356static int cma_acquire_dev(struct rdma_id_private *id_priv)
e51060f0 357{
c8f6a362 358 struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
e51060f0 359 struct cma_device *cma_dev;
3c86aa70 360 union ib_gid gid, iboe_gid;
e51060f0 361 int ret = -ENODEV;
3c86aa70
EC
362 u8 port;
363 enum rdma_link_layer dev_ll = dev_addr->dev_type == ARPHRD_INFINIBAND ?
364 IB_LINK_LAYER_INFINIBAND : IB_LINK_LAYER_ETHERNET;
e51060f0 365
2efdd6a0
MS
366 if (dev_ll != IB_LINK_LAYER_INFINIBAND &&
367 id_priv->id.ps == RDMA_PS_IPOIB)
368 return -EINVAL;
369
a396d43a 370 mutex_lock(&lock);
3c86aa70
EC
371 iboe_addr_get_sgid(dev_addr, &iboe_gid);
372 memcpy(&gid, dev_addr->src_dev_addr +
373 rdma_addr_gid_offset(dev_addr), sizeof gid);
e51060f0 374 list_for_each_entry(cma_dev, &dev_list, list) {
3c86aa70
EC
375 for (port = 1; port <= cma_dev->device->phys_port_cnt; ++port) {
376 if (rdma_port_get_link_layer(cma_dev->device, port) == dev_ll) {
377 if (rdma_node_get_transport(cma_dev->device->node_type) == RDMA_TRANSPORT_IB &&
378 rdma_port_get_link_layer(cma_dev->device, port) == IB_LINK_LAYER_ETHERNET)
379 ret = find_gid_port(cma_dev->device, &iboe_gid, port);
380 else
381 ret = find_gid_port(cma_dev->device, &gid, port);
382
383 if (!ret) {
384 id_priv->id.port_num = port;
385 goto out;
386 } else if (ret == 1)
387 break;
388 }
e51060f0
SH
389 }
390 }
3c86aa70
EC
391
392out:
393 if (!ret)
394 cma_attach_to_dev(id_priv, cma_dev);
395
a396d43a 396 mutex_unlock(&lock);
e51060f0
SH
397 return ret;
398}
399
e51060f0
SH
400static void cma_deref_id(struct rdma_id_private *id_priv)
401{
402 if (atomic_dec_and_test(&id_priv->refcount))
403 complete(&id_priv->comp);
404}
405
de910bd9 406static int cma_disable_callback(struct rdma_id_private *id_priv,
550e5ca7 407 enum rdma_cm_state state)
8aa08602 408{
de910bd9
OG
409 mutex_lock(&id_priv->handler_mutex);
410 if (id_priv->state != state) {
411 mutex_unlock(&id_priv->handler_mutex);
412 return -EINVAL;
413 }
414 return 0;
e51060f0
SH
415}
416
417struct rdma_cm_id *rdma_create_id(rdma_cm_event_handler event_handler,
b26f9b99
SH
418 void *context, enum rdma_port_space ps,
419 enum ib_qp_type qp_type)
e51060f0
SH
420{
421 struct rdma_id_private *id_priv;
422
423 id_priv = kzalloc(sizeof *id_priv, GFP_KERNEL);
424 if (!id_priv)
425 return ERR_PTR(-ENOMEM);
426
83e9502d 427 id_priv->owner = task_pid_nr(current);
550e5ca7 428 id_priv->state = RDMA_CM_IDLE;
e51060f0
SH
429 id_priv->id.context = context;
430 id_priv->id.event_handler = event_handler;
431 id_priv->id.ps = ps;
b26f9b99 432 id_priv->id.qp_type = qp_type;
e51060f0 433 spin_lock_init(&id_priv->lock);
c5483388 434 mutex_init(&id_priv->qp_mutex);
e51060f0
SH
435 init_completion(&id_priv->comp);
436 atomic_set(&id_priv->refcount, 1);
de910bd9 437 mutex_init(&id_priv->handler_mutex);
e51060f0 438 INIT_LIST_HEAD(&id_priv->listen_list);
c8f6a362 439 INIT_LIST_HEAD(&id_priv->mc_list);
e51060f0
SH
440 get_random_bytes(&id_priv->seq_num, sizeof id_priv->seq_num);
441
442 return &id_priv->id;
443}
444EXPORT_SYMBOL(rdma_create_id);
445
c8f6a362 446static int cma_init_ud_qp(struct rdma_id_private *id_priv, struct ib_qp *qp)
e51060f0
SH
447{
448 struct ib_qp_attr qp_attr;
c8f6a362 449 int qp_attr_mask, ret;
e51060f0 450
c8f6a362
SH
451 qp_attr.qp_state = IB_QPS_INIT;
452 ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
e51060f0
SH
453 if (ret)
454 return ret;
455
c8f6a362
SH
456 ret = ib_modify_qp(qp, &qp_attr, qp_attr_mask);
457 if (ret)
458 return ret;
459
460 qp_attr.qp_state = IB_QPS_RTR;
461 ret = ib_modify_qp(qp, &qp_attr, IB_QP_STATE);
462 if (ret)
463 return ret;
464
465 qp_attr.qp_state = IB_QPS_RTS;
466 qp_attr.sq_psn = 0;
467 ret = ib_modify_qp(qp, &qp_attr, IB_QP_STATE | IB_QP_SQ_PSN);
468
469 return ret;
e51060f0
SH
470}
471
c8f6a362 472static int cma_init_conn_qp(struct rdma_id_private *id_priv, struct ib_qp *qp)
07ebafba
TT
473{
474 struct ib_qp_attr qp_attr;
c8f6a362 475 int qp_attr_mask, ret;
07ebafba
TT
476
477 qp_attr.qp_state = IB_QPS_INIT;
c8f6a362
SH
478 ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
479 if (ret)
480 return ret;
07ebafba 481
c8f6a362 482 return ib_modify_qp(qp, &qp_attr, qp_attr_mask);
07ebafba
TT
483}
484
e51060f0
SH
485int rdma_create_qp(struct rdma_cm_id *id, struct ib_pd *pd,
486 struct ib_qp_init_attr *qp_init_attr)
487{
488 struct rdma_id_private *id_priv;
489 struct ib_qp *qp;
490 int ret;
491
492 id_priv = container_of(id, struct rdma_id_private, id);
493 if (id->device != pd->device)
494 return -EINVAL;
495
496 qp = ib_create_qp(pd, qp_init_attr);
497 if (IS_ERR(qp))
498 return PTR_ERR(qp);
499
b26f9b99 500 if (id->qp_type == IB_QPT_UD)
c8f6a362
SH
501 ret = cma_init_ud_qp(id_priv, qp);
502 else
503 ret = cma_init_conn_qp(id_priv, qp);
e51060f0
SH
504 if (ret)
505 goto err;
506
507 id->qp = qp;
508 id_priv->qp_num = qp->qp_num;
e51060f0
SH
509 id_priv->srq = (qp->srq != NULL);
510 return 0;
511err:
512 ib_destroy_qp(qp);
513 return ret;
514}
515EXPORT_SYMBOL(rdma_create_qp);
516
517void rdma_destroy_qp(struct rdma_cm_id *id)
518{
c5483388
SH
519 struct rdma_id_private *id_priv;
520
521 id_priv = container_of(id, struct rdma_id_private, id);
522 mutex_lock(&id_priv->qp_mutex);
523 ib_destroy_qp(id_priv->id.qp);
524 id_priv->id.qp = NULL;
525 mutex_unlock(&id_priv->qp_mutex);
e51060f0
SH
526}
527EXPORT_SYMBOL(rdma_destroy_qp);
528
5851bb89
SH
529static int cma_modify_qp_rtr(struct rdma_id_private *id_priv,
530 struct rdma_conn_param *conn_param)
e51060f0
SH
531{
532 struct ib_qp_attr qp_attr;
533 int qp_attr_mask, ret;
534
c5483388
SH
535 mutex_lock(&id_priv->qp_mutex);
536 if (!id_priv->id.qp) {
537 ret = 0;
538 goto out;
539 }
e51060f0
SH
540
541 /* Need to update QP attributes from default values. */
542 qp_attr.qp_state = IB_QPS_INIT;
c5483388 543 ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
e51060f0 544 if (ret)
c5483388 545 goto out;
e51060f0 546
c5483388 547 ret = ib_modify_qp(id_priv->id.qp, &qp_attr, qp_attr_mask);
e51060f0 548 if (ret)
c5483388 549 goto out;
e51060f0
SH
550
551 qp_attr.qp_state = IB_QPS_RTR;
c5483388 552 ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
e51060f0 553 if (ret)
c5483388 554 goto out;
e51060f0 555
5851bb89
SH
556 if (conn_param)
557 qp_attr.max_dest_rd_atomic = conn_param->responder_resources;
c5483388
SH
558 ret = ib_modify_qp(id_priv->id.qp, &qp_attr, qp_attr_mask);
559out:
560 mutex_unlock(&id_priv->qp_mutex);
561 return ret;
e51060f0
SH
562}
563
5851bb89
SH
564static int cma_modify_qp_rts(struct rdma_id_private *id_priv,
565 struct rdma_conn_param *conn_param)
e51060f0
SH
566{
567 struct ib_qp_attr qp_attr;
568 int qp_attr_mask, ret;
569
c5483388
SH
570 mutex_lock(&id_priv->qp_mutex);
571 if (!id_priv->id.qp) {
572 ret = 0;
573 goto out;
574 }
e51060f0
SH
575
576 qp_attr.qp_state = IB_QPS_RTS;
c5483388 577 ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
e51060f0 578 if (ret)
c5483388 579 goto out;
e51060f0 580
5851bb89
SH
581 if (conn_param)
582 qp_attr.max_rd_atomic = conn_param->initiator_depth;
c5483388
SH
583 ret = ib_modify_qp(id_priv->id.qp, &qp_attr, qp_attr_mask);
584out:
585 mutex_unlock(&id_priv->qp_mutex);
586 return ret;
e51060f0
SH
587}
588
c5483388 589static int cma_modify_qp_err(struct rdma_id_private *id_priv)
e51060f0
SH
590{
591 struct ib_qp_attr qp_attr;
c5483388 592 int ret;
e51060f0 593
c5483388
SH
594 mutex_lock(&id_priv->qp_mutex);
595 if (!id_priv->id.qp) {
596 ret = 0;
597 goto out;
598 }
e51060f0
SH
599
600 qp_attr.qp_state = IB_QPS_ERR;
c5483388
SH
601 ret = ib_modify_qp(id_priv->id.qp, &qp_attr, IB_QP_STATE);
602out:
603 mutex_unlock(&id_priv->qp_mutex);
604 return ret;
e51060f0
SH
605}
606
c8f6a362
SH
607static int cma_ib_init_qp_attr(struct rdma_id_private *id_priv,
608 struct ib_qp_attr *qp_attr, int *qp_attr_mask)
609{
610 struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
611 int ret;
3c86aa70
EC
612 u16 pkey;
613
614 if (rdma_port_get_link_layer(id_priv->id.device, id_priv->id.port_num) ==
615 IB_LINK_LAYER_INFINIBAND)
616 pkey = ib_addr_get_pkey(dev_addr);
617 else
618 pkey = 0xffff;
c8f6a362
SH
619
620 ret = ib_find_cached_pkey(id_priv->id.device, id_priv->id.port_num,
3c86aa70 621 pkey, &qp_attr->pkey_index);
c8f6a362
SH
622 if (ret)
623 return ret;
624
625 qp_attr->port_num = id_priv->id.port_num;
626 *qp_attr_mask = IB_QP_STATE | IB_QP_PKEY_INDEX | IB_QP_PORT;
627
b26f9b99 628 if (id_priv->id.qp_type == IB_QPT_UD) {
d2ca39f2
YE
629 ret = cma_set_qkey(id_priv);
630 if (ret)
631 return ret;
632
c8f6a362
SH
633 qp_attr->qkey = id_priv->qkey;
634 *qp_attr_mask |= IB_QP_QKEY;
635 } else {
636 qp_attr->qp_access_flags = 0;
637 *qp_attr_mask |= IB_QP_ACCESS_FLAGS;
638 }
639 return 0;
640}
641
e51060f0
SH
642int rdma_init_qp_attr(struct rdma_cm_id *id, struct ib_qp_attr *qp_attr,
643 int *qp_attr_mask)
644{
645 struct rdma_id_private *id_priv;
c8f6a362 646 int ret = 0;
e51060f0
SH
647
648 id_priv = container_of(id, struct rdma_id_private, id);
07ebafba
TT
649 switch (rdma_node_get_transport(id_priv->id.device->node_type)) {
650 case RDMA_TRANSPORT_IB:
b26f9b99 651 if (!id_priv->cm_id.ib || (id_priv->id.qp_type == IB_QPT_UD))
c8f6a362
SH
652 ret = cma_ib_init_qp_attr(id_priv, qp_attr, qp_attr_mask);
653 else
654 ret = ib_cm_init_qp_attr(id_priv->cm_id.ib, qp_attr,
655 qp_attr_mask);
e51060f0
SH
656 if (qp_attr->qp_state == IB_QPS_RTR)
657 qp_attr->rq_psn = id_priv->seq_num;
658 break;
07ebafba 659 case RDMA_TRANSPORT_IWARP:
c8f6a362 660 if (!id_priv->cm_id.iw) {
8f076531 661 qp_attr->qp_access_flags = 0;
c8f6a362
SH
662 *qp_attr_mask = IB_QP_STATE | IB_QP_ACCESS_FLAGS;
663 } else
664 ret = iw_cm_init_qp_attr(id_priv->cm_id.iw, qp_attr,
665 qp_attr_mask);
07ebafba 666 break;
e51060f0
SH
667 default:
668 ret = -ENOSYS;
669 break;
670 }
671
672 return ret;
673}
674EXPORT_SYMBOL(rdma_init_qp_attr);
675
676static inline int cma_zero_addr(struct sockaddr *addr)
677{
678 struct in6_addr *ip6;
679
680 if (addr->sa_family == AF_INET)
6360a02a
JP
681 return ipv4_is_zeronet(
682 ((struct sockaddr_in *)addr)->sin_addr.s_addr);
e51060f0
SH
683 else {
684 ip6 = &((struct sockaddr_in6 *) addr)->sin6_addr;
685 return (ip6->s6_addr32[0] | ip6->s6_addr32[1] |
5fd571cb 686 ip6->s6_addr32[2] | ip6->s6_addr32[3]) == 0;
e51060f0
SH
687 }
688}
689
690static inline int cma_loopback_addr(struct sockaddr *addr)
691{
1f5175ad
AS
692 if (addr->sa_family == AF_INET)
693 return ipv4_is_loopback(
694 ((struct sockaddr_in *) addr)->sin_addr.s_addr);
695 else
696 return ipv6_addr_loopback(
697 &((struct sockaddr_in6 *) addr)->sin6_addr);
e51060f0
SH
698}
699
/* Non-zero when @addr is either a zero address or a loopback address. */
static inline int cma_any_addr(struct sockaddr *addr)
{
	if (cma_zero_addr(addr))
		return 1;

	return cma_loopback_addr(addr) ? 1 : 0;
}
704
43b752da
HS
705static int cma_addr_cmp(struct sockaddr *src, struct sockaddr *dst)
706{
707 if (src->sa_family != dst->sa_family)
708 return -1;
709
710 switch (src->sa_family) {
711 case AF_INET:
712 return ((struct sockaddr_in *) src)->sin_addr.s_addr !=
713 ((struct sockaddr_in *) dst)->sin_addr.s_addr;
714 default:
715 return ipv6_addr_cmp(&((struct sockaddr_in6 *) src)->sin6_addr,
716 &((struct sockaddr_in6 *) dst)->sin6_addr);
717 }
718}
719
628e5f6d
SH
720static inline __be16 cma_port(struct sockaddr *addr)
721{
722 if (addr->sa_family == AF_INET)
723 return ((struct sockaddr_in *) addr)->sin_port;
724 else
725 return ((struct sockaddr_in6 *) addr)->sin6_port;
726}
727
e51060f0
SH
/* Non-zero when @addr carries port 0, i.e. no specific port. */
static inline int cma_any_port(struct sockaddr *addr)
{
	return cma_port(addr) == 0;
}
732
733static int cma_get_net_info(void *hdr, enum rdma_port_space ps,
1b90c137 734 u8 *ip_ver, __be16 *port,
e51060f0
SH
735 union cma_ip_addr **src, union cma_ip_addr **dst)
736{
737 switch (ps) {
738 case RDMA_PS_SDP:
739 if (sdp_get_majv(((struct sdp_hh *) hdr)->sdp_version) !=
740 SDP_MAJ_VERSION)
741 return -EINVAL;
742
743 *ip_ver = sdp_get_ip_ver(hdr);
744 *port = ((struct sdp_hh *) hdr)->port;
745 *src = &((struct sdp_hh *) hdr)->src_addr;
746 *dst = &((struct sdp_hh *) hdr)->dst_addr;
747 break;
748 default:
749 if (((struct cma_hdr *) hdr)->cma_version != CMA_VERSION)
750 return -EINVAL;
751
752 *ip_ver = cma_get_ip_ver(hdr);
753 *port = ((struct cma_hdr *) hdr)->port;
754 *src = &((struct cma_hdr *) hdr)->src_addr;
755 *dst = &((struct cma_hdr *) hdr)->dst_addr;
756 break;
757 }
758
759 if (*ip_ver != 4 && *ip_ver != 6)
760 return -EINVAL;
761 return 0;
762}
763
764static void cma_save_net_info(struct rdma_addr *addr,
765 struct rdma_addr *listen_addr,
1b90c137 766 u8 ip_ver, __be16 port,
e51060f0
SH
767 union cma_ip_addr *src, union cma_ip_addr *dst)
768{
769 struct sockaddr_in *listen4, *ip4;
770 struct sockaddr_in6 *listen6, *ip6;
771
772 switch (ip_ver) {
773 case 4:
774 listen4 = (struct sockaddr_in *) &listen_addr->src_addr;
775 ip4 = (struct sockaddr_in *) &addr->src_addr;
776 ip4->sin_family = listen4->sin_family;
777 ip4->sin_addr.s_addr = dst->ip4.addr;
778 ip4->sin_port = listen4->sin_port;
779
780 ip4 = (struct sockaddr_in *) &addr->dst_addr;
781 ip4->sin_family = listen4->sin_family;
782 ip4->sin_addr.s_addr = src->ip4.addr;
783 ip4->sin_port = port;
784 break;
785 case 6:
786 listen6 = (struct sockaddr_in6 *) &listen_addr->src_addr;
787 ip6 = (struct sockaddr_in6 *) &addr->src_addr;
788 ip6->sin6_family = listen6->sin6_family;
789 ip6->sin6_addr = dst->ip6;
790 ip6->sin6_port = listen6->sin6_port;
791
792 ip6 = (struct sockaddr_in6 *) &addr->dst_addr;
793 ip6->sin6_family = listen6->sin6_family;
794 ip6->sin6_addr = src->ip6;
795 ip6->sin6_port = port;
796 break;
797 default:
798 break;
799 }
800}
801
802static inline int cma_user_data_offset(enum rdma_port_space ps)
803{
804 switch (ps) {
805 case RDMA_PS_SDP:
806 return 0;
807 default:
808 return sizeof(struct cma_hdr);
809 }
810}
811
e51060f0
SH
812static void cma_cancel_route(struct rdma_id_private *id_priv)
813{
3c86aa70
EC
814 switch (rdma_port_get_link_layer(id_priv->id.device, id_priv->id.port_num)) {
815 case IB_LINK_LAYER_INFINIBAND:
e51060f0
SH
816 if (id_priv->query)
817 ib_sa_cancel_query(id_priv->query_id, id_priv->query);
818 break;
819 default:
820 break;
821 }
822}
823
e51060f0
SH
824static void cma_cancel_listens(struct rdma_id_private *id_priv)
825{
826 struct rdma_id_private *dev_id_priv;
827
d02d1f53
SH
828 /*
829 * Remove from listen_any_list to prevent added devices from spawning
830 * additional listen requests.
831 */
e51060f0
SH
832 mutex_lock(&lock);
833 list_del(&id_priv->list);
834
835 while (!list_empty(&id_priv->listen_list)) {
836 dev_id_priv = list_entry(id_priv->listen_list.next,
837 struct rdma_id_private, listen_list);
d02d1f53
SH
838 /* sync with device removal to avoid duplicate destruction */
839 list_del_init(&dev_id_priv->list);
840 list_del(&dev_id_priv->listen_list);
841 mutex_unlock(&lock);
842
843 rdma_destroy_id(&dev_id_priv->id);
844 mutex_lock(&lock);
e51060f0
SH
845 }
846 mutex_unlock(&lock);
847}
848
849static void cma_cancel_operation(struct rdma_id_private *id_priv,
550e5ca7 850 enum rdma_cm_state state)
e51060f0
SH
851{
852 switch (state) {
550e5ca7 853 case RDMA_CM_ADDR_QUERY:
e51060f0
SH
854 rdma_addr_cancel(&id_priv->id.route.addr.dev_addr);
855 break;
550e5ca7 856 case RDMA_CM_ROUTE_QUERY:
e51060f0
SH
857 cma_cancel_route(id_priv);
858 break;
550e5ca7 859 case RDMA_CM_LISTEN:
3f446754
RD
860 if (cma_any_addr((struct sockaddr *) &id_priv->id.route.addr.src_addr)
861 && !id_priv->cma_dev)
e51060f0
SH
862 cma_cancel_listens(id_priv);
863 break;
864 default:
865 break;
866 }
867}
868
869static void cma_release_port(struct rdma_id_private *id_priv)
870{
871 struct rdma_bind_list *bind_list = id_priv->bind_list;
872
873 if (!bind_list)
874 return;
875
876 mutex_lock(&lock);
877 hlist_del(&id_priv->node);
878 if (hlist_empty(&bind_list->owners)) {
879 idr_remove(bind_list->ps, bind_list->port);
880 kfree(bind_list);
881 }
882 mutex_unlock(&lock);
883}
884
c8f6a362
SH
885static void cma_leave_mc_groups(struct rdma_id_private *id_priv)
886{
887 struct cma_multicast *mc;
888
889 while (!list_empty(&id_priv->mc_list)) {
890 mc = container_of(id_priv->mc_list.next,
891 struct cma_multicast, list);
892 list_del(&mc->list);
3c86aa70
EC
893 switch (rdma_port_get_link_layer(id_priv->cma_dev->device, id_priv->id.port_num)) {
894 case IB_LINK_LAYER_INFINIBAND:
895 ib_sa_free_multicast(mc->multicast.ib);
896 kfree(mc);
897 break;
898 case IB_LINK_LAYER_ETHERNET:
899 kref_put(&mc->mcref, release_mc);
900 break;
901 default:
902 break;
903 }
c8f6a362
SH
904 }
905}
906
e51060f0
SH
907void rdma_destroy_id(struct rdma_cm_id *id)
908{
909 struct rdma_id_private *id_priv;
550e5ca7 910 enum rdma_cm_state state;
e51060f0
SH
911
912 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 913 state = cma_exch(id_priv, RDMA_CM_DESTROYING);
e51060f0
SH
914 cma_cancel_operation(id_priv, state);
915
a396d43a
SH
916 /*
917 * Wait for any active callback to finish. New callbacks will find
918 * the id_priv state set to destroying and abort.
919 */
920 mutex_lock(&id_priv->handler_mutex);
921 mutex_unlock(&id_priv->handler_mutex);
922
e51060f0 923 if (id_priv->cma_dev) {
3c86aa70 924 switch (rdma_node_get_transport(id_priv->id.device->node_type)) {
07ebafba 925 case RDMA_TRANSPORT_IB:
0c9361fc 926 if (id_priv->cm_id.ib)
e51060f0
SH
927 ib_destroy_cm_id(id_priv->cm_id.ib);
928 break;
07ebafba 929 case RDMA_TRANSPORT_IWARP:
0c9361fc 930 if (id_priv->cm_id.iw)
07ebafba
TT
931 iw_destroy_cm_id(id_priv->cm_id.iw);
932 break;
e51060f0
SH
933 default:
934 break;
935 }
c8f6a362 936 cma_leave_mc_groups(id_priv);
a396d43a 937 cma_release_dev(id_priv);
e51060f0
SH
938 }
939
940 cma_release_port(id_priv);
941 cma_deref_id(id_priv);
942 wait_for_completion(&id_priv->comp);
943
d02d1f53
SH
944 if (id_priv->internal_id)
945 cma_deref_id(id_priv->id.context);
946
e51060f0
SH
947 kfree(id_priv->id.route.path_rec);
948 kfree(id_priv);
949}
950EXPORT_SYMBOL(rdma_destroy_id);
951
952static int cma_rep_recv(struct rdma_id_private *id_priv)
953{
954 int ret;
955
5851bb89 956 ret = cma_modify_qp_rtr(id_priv, NULL);
e51060f0
SH
957 if (ret)
958 goto reject;
959
5851bb89 960 ret = cma_modify_qp_rts(id_priv, NULL);
e51060f0
SH
961 if (ret)
962 goto reject;
963
964 ret = ib_send_cm_rtu(id_priv->cm_id.ib, NULL, 0);
965 if (ret)
966 goto reject;
967
968 return 0;
969reject:
c5483388 970 cma_modify_qp_err(id_priv);
e51060f0
SH
971 ib_send_cm_rej(id_priv->cm_id.ib, IB_CM_REJ_CONSUMER_DEFINED,
972 NULL, 0, NULL, 0);
973 return ret;
974}
975
976static int cma_verify_rep(struct rdma_id_private *id_priv, void *data)
977{
978 if (id_priv->id.ps == RDMA_PS_SDP &&
979 sdp_get_majv(((struct sdp_hah *) data)->sdp_version) !=
980 SDP_MAJ_VERSION)
981 return -EINVAL;
982
983 return 0;
984}
985
a1b1b61f
SH
986static void cma_set_rep_event_data(struct rdma_cm_event *event,
987 struct ib_cm_rep_event_param *rep_data,
988 void *private_data)
989{
990 event->param.conn.private_data = private_data;
991 event->param.conn.private_data_len = IB_CM_REP_PRIVATE_DATA_SIZE;
992 event->param.conn.responder_resources = rep_data->responder_resources;
993 event->param.conn.initiator_depth = rep_data->initiator_depth;
994 event->param.conn.flow_control = rep_data->flow_control;
995 event->param.conn.rnr_retry_count = rep_data->rnr_retry_count;
996 event->param.conn.srq = rep_data->srq;
997 event->param.conn.qp_num = rep_data->remote_qpn;
998}
999
e51060f0
SH
1000static int cma_ib_handler(struct ib_cm_id *cm_id, struct ib_cm_event *ib_event)
1001{
1002 struct rdma_id_private *id_priv = cm_id->context;
a1b1b61f
SH
1003 struct rdma_cm_event event;
1004 int ret = 0;
e51060f0 1005
38ca83a5 1006 if ((ib_event->event != IB_CM_TIMEWAIT_EXIT &&
550e5ca7 1007 cma_disable_callback(id_priv, RDMA_CM_CONNECT)) ||
38ca83a5 1008 (ib_event->event == IB_CM_TIMEWAIT_EXIT &&
550e5ca7 1009 cma_disable_callback(id_priv, RDMA_CM_DISCONNECT)))
8aa08602 1010 return 0;
e51060f0 1011
a1b1b61f 1012 memset(&event, 0, sizeof event);
e51060f0
SH
1013 switch (ib_event->event) {
1014 case IB_CM_REQ_ERROR:
1015 case IB_CM_REP_ERROR:
a1b1b61f
SH
1016 event.event = RDMA_CM_EVENT_UNREACHABLE;
1017 event.status = -ETIMEDOUT;
e51060f0
SH
1018 break;
1019 case IB_CM_REP_RECEIVED:
a1b1b61f
SH
1020 event.status = cma_verify_rep(id_priv, ib_event->private_data);
1021 if (event.status)
1022 event.event = RDMA_CM_EVENT_CONNECT_ERROR;
e51060f0 1023 else if (id_priv->id.qp && id_priv->id.ps != RDMA_PS_SDP) {
a1b1b61f
SH
1024 event.status = cma_rep_recv(id_priv);
1025 event.event = event.status ? RDMA_CM_EVENT_CONNECT_ERROR :
1026 RDMA_CM_EVENT_ESTABLISHED;
e51060f0 1027 } else
a1b1b61f
SH
1028 event.event = RDMA_CM_EVENT_CONNECT_RESPONSE;
1029 cma_set_rep_event_data(&event, &ib_event->param.rep_rcvd,
1030 ib_event->private_data);
e51060f0
SH
1031 break;
1032 case IB_CM_RTU_RECEIVED:
0fe313b0
SH
1033 case IB_CM_USER_ESTABLISHED:
1034 event.event = RDMA_CM_EVENT_ESTABLISHED;
e51060f0
SH
1035 break;
1036 case IB_CM_DREQ_ERROR:
a1b1b61f 1037 event.status = -ETIMEDOUT; /* fall through */
e51060f0
SH
1038 case IB_CM_DREQ_RECEIVED:
1039 case IB_CM_DREP_RECEIVED:
550e5ca7
NM
1040 if (!cma_comp_exch(id_priv, RDMA_CM_CONNECT,
1041 RDMA_CM_DISCONNECT))
e51060f0 1042 goto out;
a1b1b61f 1043 event.event = RDMA_CM_EVENT_DISCONNECTED;
e51060f0
SH
1044 break;
1045 case IB_CM_TIMEWAIT_EXIT:
38ca83a5
AV
1046 event.event = RDMA_CM_EVENT_TIMEWAIT_EXIT;
1047 break;
e51060f0
SH
1048 case IB_CM_MRA_RECEIVED:
1049 /* ignore event */
1050 goto out;
1051 case IB_CM_REJ_RECEIVED:
c5483388 1052 cma_modify_qp_err(id_priv);
a1b1b61f
SH
1053 event.status = ib_event->param.rej_rcvd.reason;
1054 event.event = RDMA_CM_EVENT_REJECTED;
1055 event.param.conn.private_data = ib_event->private_data;
1056 event.param.conn.private_data_len = IB_CM_REJ_PRIVATE_DATA_SIZE;
e51060f0
SH
1057 break;
1058 default:
468f2239 1059 printk(KERN_ERR "RDMA CMA: unexpected IB CM event: %d\n",
e51060f0
SH
1060 ib_event->event);
1061 goto out;
1062 }
1063
a1b1b61f 1064 ret = id_priv->id.event_handler(&id_priv->id, &event);
e51060f0
SH
1065 if (ret) {
1066 /* Destroy the CM ID by returning a non-zero value. */
1067 id_priv->cm_id.ib = NULL;
550e5ca7 1068 cma_exch(id_priv, RDMA_CM_DESTROYING);
de910bd9 1069 mutex_unlock(&id_priv->handler_mutex);
e51060f0
SH
1070 rdma_destroy_id(&id_priv->id);
1071 return ret;
1072 }
1073out:
de910bd9 1074 mutex_unlock(&id_priv->handler_mutex);
e51060f0
SH
1075 return ret;
1076}
1077
628e5f6d
SH
1078static struct rdma_id_private *cma_new_conn_id(struct rdma_cm_id *listen_id,
1079 struct ib_cm_event *ib_event)
e51060f0
SH
1080{
1081 struct rdma_id_private *id_priv;
1082 struct rdma_cm_id *id;
1083 struct rdma_route *rt;
1084 union cma_ip_addr *src, *dst;
1b90c137 1085 __be16 port;
e51060f0 1086 u8 ip_ver;
64c5e613 1087 int ret;
e51060f0 1088
3f168d2b
KK
1089 if (cma_get_net_info(ib_event->private_data, listen_id->ps,
1090 &ip_ver, &port, &src, &dst))
0c9361fc 1091 return NULL;
3f168d2b 1092
e51060f0 1093 id = rdma_create_id(listen_id->event_handler, listen_id->context,
b26f9b99 1094 listen_id->ps, ib_event->param.req_rcvd.qp_type);
e51060f0 1095 if (IS_ERR(id))
0c9361fc 1096 return NULL;
3f168d2b
KK
1097
1098 cma_save_net_info(&id->route.addr, &listen_id->route.addr,
1099 ip_ver, port, src, dst);
e51060f0
SH
1100
1101 rt = &id->route;
1102 rt->num_paths = ib_event->param.req_rcvd.alternate_path ? 2 : 1;
3f168d2b
KK
1103 rt->path_rec = kmalloc(sizeof *rt->path_rec * rt->num_paths,
1104 GFP_KERNEL);
e51060f0 1105 if (!rt->path_rec)
0c9361fc 1106 goto err;
e51060f0 1107
e51060f0
SH
1108 rt->path_rec[0] = *ib_event->param.req_rcvd.primary_path;
1109 if (rt->num_paths == 2)
1110 rt->path_rec[1] = *ib_event->param.req_rcvd.alternate_path;
1111
6f8372b6
SH
1112 if (cma_any_addr((struct sockaddr *) &rt->addr.src_addr)) {
1113 rt->addr.dev_addr.dev_type = ARPHRD_INFINIBAND;
1114 rdma_addr_set_sgid(&rt->addr.dev_addr, &rt->path_rec[0].sgid);
46ea5061 1115 ib_addr_set_pkey(&rt->addr.dev_addr, be16_to_cpu(rt->path_rec[0].pkey));
6f8372b6
SH
1116 } else {
1117 ret = rdma_translate_ip((struct sockaddr *) &rt->addr.src_addr,
1118 &rt->addr.dev_addr);
1119 if (ret)
0c9361fc 1120 goto err;
6f8372b6
SH
1121 }
1122 rdma_addr_set_dgid(&rt->addr.dev_addr, &rt->path_rec[0].dgid);
e51060f0
SH
1123
1124 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 1125 id_priv->state = RDMA_CM_CONNECT;
e51060f0 1126 return id_priv;
3f168d2b 1127
3f168d2b 1128err:
0c9361fc 1129 rdma_destroy_id(id);
e51060f0
SH
1130 return NULL;
1131}
1132
628e5f6d
SH
1133static struct rdma_id_private *cma_new_udp_id(struct rdma_cm_id *listen_id,
1134 struct ib_cm_event *ib_event)
1135{
1136 struct rdma_id_private *id_priv;
1137 struct rdma_cm_id *id;
1138 union cma_ip_addr *src, *dst;
1b90c137 1139 __be16 port;
628e5f6d
SH
1140 u8 ip_ver;
1141 int ret;
1142
1143 id = rdma_create_id(listen_id->event_handler, listen_id->context,
b26f9b99 1144 listen_id->ps, IB_QPT_UD);
628e5f6d
SH
1145 if (IS_ERR(id))
1146 return NULL;
1147
1148
1149 if (cma_get_net_info(ib_event->private_data, listen_id->ps,
1150 &ip_ver, &port, &src, &dst))
1151 goto err;
1152
1153 cma_save_net_info(&id->route.addr, &listen_id->route.addr,
1154 ip_ver, port, src, dst);
1155
6f8372b6
SH
1156 if (!cma_any_addr((struct sockaddr *) &id->route.addr.src_addr)) {
1157 ret = rdma_translate_ip((struct sockaddr *) &id->route.addr.src_addr,
1158 &id->route.addr.dev_addr);
1159 if (ret)
1160 goto err;
1161 }
628e5f6d
SH
1162
1163 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 1164 id_priv->state = RDMA_CM_CONNECT;
628e5f6d
SH
1165 return id_priv;
1166err:
1167 rdma_destroy_id(id);
1168 return NULL;
1169}
1170
a1b1b61f
SH
1171static void cma_set_req_event_data(struct rdma_cm_event *event,
1172 struct ib_cm_req_event_param *req_data,
1173 void *private_data, int offset)
1174{
1175 event->param.conn.private_data = private_data + offset;
1176 event->param.conn.private_data_len = IB_CM_REQ_PRIVATE_DATA_SIZE - offset;
1177 event->param.conn.responder_resources = req_data->responder_resources;
1178 event->param.conn.initiator_depth = req_data->initiator_depth;
1179 event->param.conn.flow_control = req_data->flow_control;
1180 event->param.conn.retry_count = req_data->retry_count;
1181 event->param.conn.rnr_retry_count = req_data->rnr_retry_count;
1182 event->param.conn.srq = req_data->srq;
1183 event->param.conn.qp_num = req_data->remote_qpn;
1184}
1185
9595480c
HS
1186static int cma_check_req_qp_type(struct rdma_cm_id *id, struct ib_cm_event *ib_event)
1187{
4dd81e89 1188 return (((ib_event->event == IB_CM_REQ_RECEIVED) &&
9595480c
HS
1189 (ib_event->param.req_rcvd.qp_type == id->qp_type)) ||
1190 ((ib_event->event == IB_CM_SIDR_REQ_RECEIVED) &&
1191 (id->qp_type == IB_QPT_UD)) ||
1192 (!id->qp_type));
1193}
1194
e51060f0
SH
1195static int cma_req_handler(struct ib_cm_id *cm_id, struct ib_cm_event *ib_event)
1196{
1197 struct rdma_id_private *listen_id, *conn_id;
a1b1b61f 1198 struct rdma_cm_event event;
e51060f0
SH
1199 int offset, ret;
1200
1201 listen_id = cm_id->context;
9595480c
HS
1202 if (!cma_check_req_qp_type(&listen_id->id, ib_event))
1203 return -EINVAL;
1204
550e5ca7 1205 if (cma_disable_callback(listen_id, RDMA_CM_LISTEN))
8aa08602 1206 return -ECONNABORTED;
e51060f0 1207
628e5f6d
SH
1208 memset(&event, 0, sizeof event);
1209 offset = cma_user_data_offset(listen_id->id.ps);
1210 event.event = RDMA_CM_EVENT_CONNECT_REQUEST;
9595480c 1211 if (ib_event->event == IB_CM_SIDR_REQ_RECEIVED) {
628e5f6d
SH
1212 conn_id = cma_new_udp_id(&listen_id->id, ib_event);
1213 event.param.ud.private_data = ib_event->private_data + offset;
1214 event.param.ud.private_data_len =
1215 IB_CM_SIDR_REQ_PRIVATE_DATA_SIZE - offset;
1216 } else {
1217 conn_id = cma_new_conn_id(&listen_id->id, ib_event);
1218 cma_set_req_event_data(&event, &ib_event->param.req_rcvd,
1219 ib_event->private_data, offset);
1220 }
e51060f0
SH
1221 if (!conn_id) {
1222 ret = -ENOMEM;
b6cec8aa 1223 goto err1;
e51060f0
SH
1224 }
1225
de910bd9 1226 mutex_lock_nested(&conn_id->handler_mutex, SINGLE_DEPTH_NESTING);
07ebafba 1227 ret = cma_acquire_dev(conn_id);
a1a733f6 1228 if (ret)
b6cec8aa 1229 goto err2;
e51060f0
SH
1230
1231 conn_id->cm_id.ib = cm_id;
1232 cm_id->context = conn_id;
1233 cm_id->cm_handler = cma_ib_handler;
1234
25ae21a1
SH
1235 /*
1236 * Protect against the user destroying conn_id from another thread
1237 * until we're done accessing it.
1238 */
1239 atomic_inc(&conn_id->refcount);
a1b1b61f 1240 ret = conn_id->id.event_handler(&conn_id->id, &event);
b6cec8aa
SH
1241 if (ret)
1242 goto err3;
1243
1244 /*
1245 * Acquire mutex to prevent user executing rdma_destroy_id()
1246 * while we're accessing the cm_id.
1247 */
1248 mutex_lock(&lock);
1249 if (cma_comp(conn_id, RDMA_CM_CONNECT) && (conn_id->id.qp_type != IB_QPT_UD))
1250 ib_send_cm_mra(cm_id, CMA_CM_MRA_SETTING, NULL, 0);
1251 mutex_unlock(&lock);
1252 mutex_unlock(&conn_id->handler_mutex);
1253 mutex_unlock(&listen_id->handler_mutex);
25ae21a1 1254 cma_deref_id(conn_id);
b6cec8aa 1255 return 0;
a1a733f6 1256
b6cec8aa
SH
1257err3:
1258 cma_deref_id(conn_id);
a1a733f6
KK
1259 /* Destroy the CM ID by returning a non-zero value. */
1260 conn_id->cm_id.ib = NULL;
b6cec8aa 1261err2:
550e5ca7 1262 cma_exch(conn_id, RDMA_CM_DESTROYING);
de910bd9 1263 mutex_unlock(&conn_id->handler_mutex);
b6cec8aa 1264err1:
de910bd9 1265 mutex_unlock(&listen_id->handler_mutex);
b6cec8aa
SH
1266 if (conn_id)
1267 rdma_destroy_id(&conn_id->id);
e51060f0
SH
1268 return ret;
1269}
1270
1271static __be64 cma_get_service_id(enum rdma_port_space ps, struct sockaddr *addr)
1272{
628e5f6d 1273 return cpu_to_be64(((u64)ps << 16) + be16_to_cpu(cma_port(addr)));
e51060f0
SH
1274}
1275
1276static void cma_set_compare_data(enum rdma_port_space ps, struct sockaddr *addr,
1277 struct ib_cm_compare_data *compare)
1278{
1279 struct cma_hdr *cma_data, *cma_mask;
1280 struct sdp_hh *sdp_data, *sdp_mask;
1b90c137 1281 __be32 ip4_addr;
e51060f0
SH
1282 struct in6_addr ip6_addr;
1283
1284 memset(compare, 0, sizeof *compare);
1285 cma_data = (void *) compare->data;
1286 cma_mask = (void *) compare->mask;
1287 sdp_data = (void *) compare->data;
1288 sdp_mask = (void *) compare->mask;
1289
1290 switch (addr->sa_family) {
1291 case AF_INET:
1292 ip4_addr = ((struct sockaddr_in *) addr)->sin_addr.s_addr;
1293 if (ps == RDMA_PS_SDP) {
1294 sdp_set_ip_ver(sdp_data, 4);
1295 sdp_set_ip_ver(sdp_mask, 0xF);
1296 sdp_data->dst_addr.ip4.addr = ip4_addr;
1b90c137 1297 sdp_mask->dst_addr.ip4.addr = htonl(~0);
e51060f0
SH
1298 } else {
1299 cma_set_ip_ver(cma_data, 4);
1300 cma_set_ip_ver(cma_mask, 0xF);
406b6a25
SH
1301 if (!cma_any_addr(addr)) {
1302 cma_data->dst_addr.ip4.addr = ip4_addr;
1303 cma_mask->dst_addr.ip4.addr = htonl(~0);
1304 }
e51060f0
SH
1305 }
1306 break;
1307 case AF_INET6:
1308 ip6_addr = ((struct sockaddr_in6 *) addr)->sin6_addr;
1309 if (ps == RDMA_PS_SDP) {
1310 sdp_set_ip_ver(sdp_data, 6);
1311 sdp_set_ip_ver(sdp_mask, 0xF);
1312 sdp_data->dst_addr.ip6 = ip6_addr;
1313 memset(&sdp_mask->dst_addr.ip6, 0xFF,
1314 sizeof sdp_mask->dst_addr.ip6);
1315 } else {
1316 cma_set_ip_ver(cma_data, 6);
1317 cma_set_ip_ver(cma_mask, 0xF);
406b6a25
SH
1318 if (!cma_any_addr(addr)) {
1319 cma_data->dst_addr.ip6 = ip6_addr;
1320 memset(&cma_mask->dst_addr.ip6, 0xFF,
1321 sizeof cma_mask->dst_addr.ip6);
1322 }
e51060f0
SH
1323 }
1324 break;
1325 default:
1326 break;
1327 }
1328}
1329
07ebafba
TT
/*
 * iWARP CM callback installed on connection cm_ids.
 *
 * Translates the iWARP CM event into an rdma_cm_event and hands it to the
 * user's handler.  When that handler returns non-zero, the rdma_cm_id is
 * destroyed here and the value is returned.
 */
static int cma_iw_handler(struct iw_cm_id *iw_id, struct iw_cm_event *iw_event)
{
	struct rdma_id_private *id_priv = iw_id->context;
	struct rdma_addr *addr = &id_priv->id.route.addr;
	struct rdma_cm_event event;
	int ret = 0;

	if (cma_disable_callback(id_priv, RDMA_CM_CONNECT))
		return 0;

	memset(&event, 0, sizeof(event));

	switch (iw_event->event) {
	case IW_CM_EVENT_CLOSE:
		event.event = RDMA_CM_EVENT_DISCONNECTED;
		break;
	case IW_CM_EVENT_CONNECT_REPLY:
		/* Record the addresses the connection actually ended up with. */
		*(struct sockaddr_in *) &addr->src_addr = iw_event->local_addr;
		*(struct sockaddr_in *) &addr->dst_addr = iw_event->remote_addr;

		if (!iw_event->status) {
			event.event = RDMA_CM_EVENT_ESTABLISHED;
			event.param.conn.initiator_depth = iw_event->ird;
			event.param.conn.responder_resources = iw_event->ord;
		} else if (iw_event->status == -ECONNRESET ||
			   iw_event->status == -ECONNREFUSED) {
			event.event = RDMA_CM_EVENT_REJECTED;
		} else if (iw_event->status == -ETIMEDOUT) {
			event.event = RDMA_CM_EVENT_UNREACHABLE;
		} else {
			event.event = RDMA_CM_EVENT_CONNECT_ERROR;
		}
		break;
	case IW_CM_EVENT_ESTABLISHED:
		event.event = RDMA_CM_EVENT_ESTABLISHED;
		event.param.conn.initiator_depth = iw_event->ird;
		event.param.conn.responder_resources = iw_event->ord;
		break;
	default:
		BUG_ON(1);
	}

	event.status = iw_event->status;
	event.param.conn.private_data = iw_event->private_data;
	event.param.conn.private_data_len = iw_event->private_data_len;

	ret = id_priv->id.event_handler(&id_priv->id, &event);
	if (ret) {
		/* Destroy the CM ID by returning a non-zero value. */
		id_priv->cm_id.iw = NULL;
		cma_exch(id_priv, RDMA_CM_DESTROYING);
		mutex_unlock(&id_priv->handler_mutex);
		rdma_destroy_id(&id_priv->id);
		return ret;
	}

	mutex_unlock(&id_priv->handler_mutex);
	return ret;
}
1393
1394static int iw_conn_req_handler(struct iw_cm_id *cm_id,
1395 struct iw_cm_event *iw_event)
1396{
1397 struct rdma_cm_id *new_cm_id;
1398 struct rdma_id_private *listen_id, *conn_id;
1399 struct sockaddr_in *sin;
1400 struct net_device *dev = NULL;
a1b1b61f 1401 struct rdma_cm_event event;
07ebafba 1402 int ret;
8d8293cf 1403 struct ib_device_attr attr;
07ebafba
TT
1404
1405 listen_id = cm_id->context;
550e5ca7 1406 if (cma_disable_callback(listen_id, RDMA_CM_LISTEN))
8aa08602 1407 return -ECONNABORTED;
07ebafba
TT
1408
1409 /* Create a new RDMA id for the new IW CM ID */
1410 new_cm_id = rdma_create_id(listen_id->id.event_handler,
1411 listen_id->id.context,
b26f9b99 1412 RDMA_PS_TCP, IB_QPT_RC);
10f32065 1413 if (IS_ERR(new_cm_id)) {
07ebafba
TT
1414 ret = -ENOMEM;
1415 goto out;
1416 }
1417 conn_id = container_of(new_cm_id, struct rdma_id_private, id);
de910bd9 1418 mutex_lock_nested(&conn_id->handler_mutex, SINGLE_DEPTH_NESTING);
550e5ca7 1419 conn_id->state = RDMA_CM_CONNECT;
07ebafba 1420
1ab35276 1421 dev = ip_dev_find(&init_net, iw_event->local_addr.sin_addr.s_addr);
07ebafba
TT
1422 if (!dev) {
1423 ret = -EADDRNOTAVAIL;
de910bd9 1424 mutex_unlock(&conn_id->handler_mutex);
07ebafba
TT
1425 rdma_destroy_id(new_cm_id);
1426 goto out;
1427 }
1428 ret = rdma_copy_addr(&conn_id->id.route.addr.dev_addr, dev, NULL);
1429 if (ret) {
de910bd9 1430 mutex_unlock(&conn_id->handler_mutex);
07ebafba
TT
1431 rdma_destroy_id(new_cm_id);
1432 goto out;
1433 }
1434
1435 ret = cma_acquire_dev(conn_id);
1436 if (ret) {
de910bd9 1437 mutex_unlock(&conn_id->handler_mutex);
07ebafba
TT
1438 rdma_destroy_id(new_cm_id);
1439 goto out;
1440 }
1441
1442 conn_id->cm_id.iw = cm_id;
1443 cm_id->context = conn_id;
1444 cm_id->cm_handler = cma_iw_handler;
1445
1446 sin = (struct sockaddr_in *) &new_cm_id->route.addr.src_addr;
1447 *sin = iw_event->local_addr;
1448 sin = (struct sockaddr_in *) &new_cm_id->route.addr.dst_addr;
1449 *sin = iw_event->remote_addr;
1450
8d8293cf
SW
1451 ret = ib_query_device(conn_id->id.device, &attr);
1452 if (ret) {
de910bd9 1453 mutex_unlock(&conn_id->handler_mutex);
8d8293cf
SW
1454 rdma_destroy_id(new_cm_id);
1455 goto out;
1456 }
1457
a1b1b61f
SH
1458 memset(&event, 0, sizeof event);
1459 event.event = RDMA_CM_EVENT_CONNECT_REQUEST;
1460 event.param.conn.private_data = iw_event->private_data;
1461 event.param.conn.private_data_len = iw_event->private_data_len;
3ebeebc3
KS
1462 event.param.conn.initiator_depth = iw_event->ird;
1463 event.param.conn.responder_resources = iw_event->ord;
25ae21a1
SH
1464
1465 /*
1466 * Protect against the user destroying conn_id from another thread
1467 * until we're done accessing it.
1468 */
1469 atomic_inc(&conn_id->refcount);
a1b1b61f 1470 ret = conn_id->id.event_handler(&conn_id->id, &event);
07ebafba
TT
1471 if (ret) {
1472 /* User wants to destroy the CM ID */
1473 conn_id->cm_id.iw = NULL;
550e5ca7 1474 cma_exch(conn_id, RDMA_CM_DESTROYING);
de910bd9 1475 mutex_unlock(&conn_id->handler_mutex);
25ae21a1 1476 cma_deref_id(conn_id);
07ebafba 1477 rdma_destroy_id(&conn_id->id);
de910bd9 1478 goto out;
07ebafba
TT
1479 }
1480
de910bd9 1481 mutex_unlock(&conn_id->handler_mutex);
25ae21a1 1482 cma_deref_id(conn_id);
de910bd9 1483
07ebafba
TT
1484out:
1485 if (dev)
1486 dev_put(dev);
de910bd9 1487 mutex_unlock(&listen_id->handler_mutex);
07ebafba
TT
1488 return ret;
1489}
1490
e51060f0
SH
1491static int cma_ib_listen(struct rdma_id_private *id_priv)
1492{
1493 struct ib_cm_compare_data compare_data;
1494 struct sockaddr *addr;
0c9361fc 1495 struct ib_cm_id *id;
e51060f0
SH
1496 __be64 svc_id;
1497 int ret;
1498
0c9361fc
JM
1499 id = ib_create_cm_id(id_priv->id.device, cma_req_handler, id_priv);
1500 if (IS_ERR(id))
1501 return PTR_ERR(id);
1502
1503 id_priv->cm_id.ib = id;
e51060f0 1504
3f446754 1505 addr = (struct sockaddr *) &id_priv->id.route.addr.src_addr;
e51060f0 1506 svc_id = cma_get_service_id(id_priv->id.ps, addr);
406b6a25 1507 if (cma_any_addr(addr) && !id_priv->afonly)
e51060f0
SH
1508 ret = ib_cm_listen(id_priv->cm_id.ib, svc_id, 0, NULL);
1509 else {
1510 cma_set_compare_data(id_priv->id.ps, addr, &compare_data);
1511 ret = ib_cm_listen(id_priv->cm_id.ib, svc_id, 0, &compare_data);
1512 }
1513
1514 if (ret) {
1515 ib_destroy_cm_id(id_priv->cm_id.ib);
1516 id_priv->cm_id.ib = NULL;
1517 }
1518
1519 return ret;
1520}
1521
07ebafba
TT
1522static int cma_iw_listen(struct rdma_id_private *id_priv, int backlog)
1523{
1524 int ret;
1525 struct sockaddr_in *sin;
0c9361fc
JM
1526 struct iw_cm_id *id;
1527
1528 id = iw_create_cm_id(id_priv->id.device,
1529 iw_conn_req_handler,
1530 id_priv);
1531 if (IS_ERR(id))
1532 return PTR_ERR(id);
07ebafba 1533
0c9361fc 1534 id_priv->cm_id.iw = id;
07ebafba
TT
1535
1536 sin = (struct sockaddr_in *) &id_priv->id.route.addr.src_addr;
1537 id_priv->cm_id.iw->local_addr = *sin;
1538
1539 ret = iw_cm_listen(id_priv->cm_id.iw, backlog);
1540
1541 if (ret) {
1542 iw_destroy_cm_id(id_priv->cm_id.iw);
1543 id_priv->cm_id.iw = NULL;
1544 }
1545
1546 return ret;
1547}
1548
e51060f0
SH
1549static int cma_listen_handler(struct rdma_cm_id *id,
1550 struct rdma_cm_event *event)
1551{
1552 struct rdma_id_private *id_priv = id->context;
1553
1554 id->context = id_priv->id.context;
1555 id->event_handler = id_priv->id.event_handler;
1556 return id_priv->id.event_handler(id, event);
1557}
1558
1559static void cma_listen_on_dev(struct rdma_id_private *id_priv,
1560 struct cma_device *cma_dev)
1561{
1562 struct rdma_id_private *dev_id_priv;
1563 struct rdma_cm_id *id;
1564 int ret;
1565
b26f9b99
SH
1566 id = rdma_create_id(cma_listen_handler, id_priv, id_priv->id.ps,
1567 id_priv->id.qp_type);
e51060f0
SH
1568 if (IS_ERR(id))
1569 return;
1570
1571 dev_id_priv = container_of(id, struct rdma_id_private, id);
1572
550e5ca7 1573 dev_id_priv->state = RDMA_CM_ADDR_BOUND;
e51060f0 1574 memcpy(&id->route.addr.src_addr, &id_priv->id.route.addr.src_addr,
3f446754 1575 ip_addr_size((struct sockaddr *) &id_priv->id.route.addr.src_addr));
e51060f0
SH
1576
1577 cma_attach_to_dev(dev_id_priv, cma_dev);
1578 list_add_tail(&dev_id_priv->listen_list, &id_priv->listen_list);
d02d1f53
SH
1579 atomic_inc(&id_priv->refcount);
1580 dev_id_priv->internal_id = 1;
5b0ec991 1581 dev_id_priv->afonly = id_priv->afonly;
e51060f0
SH
1582
1583 ret = rdma_listen(id, id_priv->backlog);
1584 if (ret)
d02d1f53 1585 printk(KERN_WARNING "RDMA CMA: cma_listen_on_dev, error %d, "
468f2239 1586 "listening on device %s\n", ret, cma_dev->device->name);
e51060f0
SH
1587}
1588
1589static void cma_listen_on_all(struct rdma_id_private *id_priv)
1590{
1591 struct cma_device *cma_dev;
1592
1593 mutex_lock(&lock);
1594 list_add_tail(&id_priv->list, &listen_any_list);
1595 list_for_each_entry(cma_dev, &dev_list, list)
1596 cma_listen_on_dev(id_priv, cma_dev);
1597 mutex_unlock(&lock);
1598}
1599
a81c994d
SH
1600void rdma_set_service_type(struct rdma_cm_id *id, int tos)
1601{
1602 struct rdma_id_private *id_priv;
1603
1604 id_priv = container_of(id, struct rdma_id_private, id);
1605 id_priv->tos = (u8) tos;
1606}
1607EXPORT_SYMBOL(rdma_set_service_type);
1608
e51060f0
SH
1609static void cma_query_handler(int status, struct ib_sa_path_rec *path_rec,
1610 void *context)
1611{
1612 struct cma_work *work = context;
1613 struct rdma_route *route;
1614
1615 route = &work->id->id.route;
1616
1617 if (!status) {
1618 route->num_paths = 1;
1619 *route->path_rec = *path_rec;
1620 } else {
550e5ca7
NM
1621 work->old_state = RDMA_CM_ROUTE_QUERY;
1622 work->new_state = RDMA_CM_ADDR_RESOLVED;
e51060f0 1623 work->event.event = RDMA_CM_EVENT_ROUTE_ERROR;
8f0472d3 1624 work->event.status = status;
e51060f0
SH
1625 }
1626
1627 queue_work(cma_wq, &work->work);
1628}
1629
1630static int cma_query_ib_route(struct rdma_id_private *id_priv, int timeout_ms,
1631 struct cma_work *work)
1632{
a81c994d 1633 struct rdma_addr *addr = &id_priv->id.route.addr;
e51060f0 1634 struct ib_sa_path_rec path_rec;
a81c994d
SH
1635 ib_sa_comp_mask comp_mask;
1636 struct sockaddr_in6 *sin6;
e51060f0
SH
1637
1638 memset(&path_rec, 0, sizeof path_rec);
6f8372b6
SH
1639 rdma_addr_get_sgid(&addr->dev_addr, &path_rec.sgid);
1640 rdma_addr_get_dgid(&addr->dev_addr, &path_rec.dgid);
a81c994d 1641 path_rec.pkey = cpu_to_be16(ib_addr_get_pkey(&addr->dev_addr));
e51060f0 1642 path_rec.numb_path = 1;
962063e6 1643 path_rec.reversible = 1;
3f446754
RD
1644 path_rec.service_id = cma_get_service_id(id_priv->id.ps,
1645 (struct sockaddr *) &addr->dst_addr);
a81c994d
SH
1646
1647 comp_mask = IB_SA_PATH_REC_DGID | IB_SA_PATH_REC_SGID |
1648 IB_SA_PATH_REC_PKEY | IB_SA_PATH_REC_NUMB_PATH |
1649 IB_SA_PATH_REC_REVERSIBLE | IB_SA_PATH_REC_SERVICE_ID;
1650
3f446754 1651 if (addr->src_addr.ss_family == AF_INET) {
a81c994d
SH
1652 path_rec.qos_class = cpu_to_be16((u16) id_priv->tos);
1653 comp_mask |= IB_SA_PATH_REC_QOS_CLASS;
1654 } else {
1655 sin6 = (struct sockaddr_in6 *) &addr->src_addr;
1656 path_rec.traffic_class = (u8) (be32_to_cpu(sin6->sin6_flowinfo) >> 20);
1657 comp_mask |= IB_SA_PATH_REC_TRAFFIC_CLASS;
1658 }
e51060f0 1659
c1a0b23b 1660 id_priv->query_id = ib_sa_path_rec_get(&sa_client, id_priv->id.device,
a81c994d
SH
1661 id_priv->id.port_num, &path_rec,
1662 comp_mask, timeout_ms,
1663 GFP_KERNEL, cma_query_handler,
1664 work, &id_priv->query);
e51060f0
SH
1665
1666 return (id_priv->query_id < 0) ? id_priv->query_id : 0;
1667}
1668
c4028958 1669static void cma_work_handler(struct work_struct *_work)
e51060f0 1670{
c4028958 1671 struct cma_work *work = container_of(_work, struct cma_work, work);
e51060f0
SH
1672 struct rdma_id_private *id_priv = work->id;
1673 int destroy = 0;
1674
de910bd9 1675 mutex_lock(&id_priv->handler_mutex);
e51060f0
SH
1676 if (!cma_comp_exch(id_priv, work->old_state, work->new_state))
1677 goto out;
1678
1679 if (id_priv->id.event_handler(&id_priv->id, &work->event)) {
550e5ca7 1680 cma_exch(id_priv, RDMA_CM_DESTROYING);
e51060f0
SH
1681 destroy = 1;
1682 }
1683out:
de910bd9 1684 mutex_unlock(&id_priv->handler_mutex);
e51060f0
SH
1685 cma_deref_id(id_priv);
1686 if (destroy)
1687 rdma_destroy_id(&id_priv->id);
1688 kfree(work);
1689}
1690
dd5bdff8
OG
1691static void cma_ndev_work_handler(struct work_struct *_work)
1692{
1693 struct cma_ndev_work *work = container_of(_work, struct cma_ndev_work, work);
1694 struct rdma_id_private *id_priv = work->id;
1695 int destroy = 0;
1696
1697 mutex_lock(&id_priv->handler_mutex);
550e5ca7
NM
1698 if (id_priv->state == RDMA_CM_DESTROYING ||
1699 id_priv->state == RDMA_CM_DEVICE_REMOVAL)
dd5bdff8
OG
1700 goto out;
1701
1702 if (id_priv->id.event_handler(&id_priv->id, &work->event)) {
550e5ca7 1703 cma_exch(id_priv, RDMA_CM_DESTROYING);
dd5bdff8
OG
1704 destroy = 1;
1705 }
1706
1707out:
1708 mutex_unlock(&id_priv->handler_mutex);
1709 cma_deref_id(id_priv);
1710 if (destroy)
1711 rdma_destroy_id(&id_priv->id);
1712 kfree(work);
1713}
1714
e51060f0
SH
1715static int cma_resolve_ib_route(struct rdma_id_private *id_priv, int timeout_ms)
1716{
1717 struct rdma_route *route = &id_priv->id.route;
1718 struct cma_work *work;
1719 int ret;
1720
1721 work = kzalloc(sizeof *work, GFP_KERNEL);
1722 if (!work)
1723 return -ENOMEM;
1724
1725 work->id = id_priv;
c4028958 1726 INIT_WORK(&work->work, cma_work_handler);
550e5ca7
NM
1727 work->old_state = RDMA_CM_ROUTE_QUERY;
1728 work->new_state = RDMA_CM_ROUTE_RESOLVED;
e51060f0
SH
1729 work->event.event = RDMA_CM_EVENT_ROUTE_RESOLVED;
1730
1731 route->path_rec = kmalloc(sizeof *route->path_rec, GFP_KERNEL);
1732 if (!route->path_rec) {
1733 ret = -ENOMEM;
1734 goto err1;
1735 }
1736
1737 ret = cma_query_ib_route(id_priv, timeout_ms, work);
1738 if (ret)
1739 goto err2;
1740
1741 return 0;
1742err2:
1743 kfree(route->path_rec);
1744 route->path_rec = NULL;
1745err1:
1746 kfree(work);
1747 return ret;
1748}
1749
1750int rdma_set_ib_paths(struct rdma_cm_id *id,
1751 struct ib_sa_path_rec *path_rec, int num_paths)
1752{
1753 struct rdma_id_private *id_priv;
1754 int ret;
1755
1756 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7
NM
1757 if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_RESOLVED,
1758 RDMA_CM_ROUTE_RESOLVED))
e51060f0
SH
1759 return -EINVAL;
1760
9893e742
JL
1761 id->route.path_rec = kmemdup(path_rec, sizeof *path_rec * num_paths,
1762 GFP_KERNEL);
e51060f0
SH
1763 if (!id->route.path_rec) {
1764 ret = -ENOMEM;
1765 goto err;
1766 }
1767
ae2d9293 1768 id->route.num_paths = num_paths;
e51060f0
SH
1769 return 0;
1770err:
550e5ca7 1771 cma_comp_exch(id_priv, RDMA_CM_ROUTE_RESOLVED, RDMA_CM_ADDR_RESOLVED);
e51060f0
SH
1772 return ret;
1773}
1774EXPORT_SYMBOL(rdma_set_ib_paths);
1775
07ebafba
TT
1776static int cma_resolve_iw_route(struct rdma_id_private *id_priv, int timeout_ms)
1777{
1778 struct cma_work *work;
1779
1780 work = kzalloc(sizeof *work, GFP_KERNEL);
1781 if (!work)
1782 return -ENOMEM;
1783
1784 work->id = id_priv;
c4028958 1785 INIT_WORK(&work->work, cma_work_handler);
550e5ca7
NM
1786 work->old_state = RDMA_CM_ROUTE_QUERY;
1787 work->new_state = RDMA_CM_ROUTE_RESOLVED;
07ebafba
TT
1788 work->event.event = RDMA_CM_EVENT_ROUTE_RESOLVED;
1789 queue_work(cma_wq, &work->work);
1790 return 0;
1791}
1792
3c86aa70
EC
1793static int cma_resolve_iboe_route(struct rdma_id_private *id_priv)
1794{
1795 struct rdma_route *route = &id_priv->id.route;
1796 struct rdma_addr *addr = &route->addr;
1797 struct cma_work *work;
1798 int ret;
1799 struct sockaddr_in *src_addr = (struct sockaddr_in *)&route->addr.src_addr;
1800 struct sockaddr_in *dst_addr = (struct sockaddr_in *)&route->addr.dst_addr;
1801 struct net_device *ndev = NULL;
af7bd463 1802 u16 vid;
3c86aa70
EC
1803
1804 if (src_addr->sin_family != dst_addr->sin_family)
1805 return -EINVAL;
1806
1807 work = kzalloc(sizeof *work, GFP_KERNEL);
1808 if (!work)
1809 return -ENOMEM;
1810
1811 work->id = id_priv;
1812 INIT_WORK(&work->work, cma_work_handler);
1813
1814 route->path_rec = kzalloc(sizeof *route->path_rec, GFP_KERNEL);
1815 if (!route->path_rec) {
1816 ret = -ENOMEM;
1817 goto err1;
1818 }
1819
1820 route->num_paths = 1;
1821
3c86aa70
EC
1822 if (addr->dev_addr.bound_dev_if)
1823 ndev = dev_get_by_index(&init_net, addr->dev_addr.bound_dev_if);
1824 if (!ndev) {
1825 ret = -ENODEV;
1826 goto err2;
1827 }
1828
af7bd463
EC
1829 vid = rdma_vlan_dev_vlan_id(ndev);
1830
1831 iboe_mac_vlan_to_ll(&route->path_rec->sgid, addr->dev_addr.src_dev_addr, vid);
1832 iboe_mac_vlan_to_ll(&route->path_rec->dgid, addr->dev_addr.dst_dev_addr, vid);
1833
1834 route->path_rec->hop_limit = 1;
1835 route->path_rec->reversible = 1;
1836 route->path_rec->pkey = cpu_to_be16(0xffff);
1837 route->path_rec->mtu_selector = IB_SA_EQ;
366cddb4
AV
1838 route->path_rec->sl = netdev_get_prio_tc_map(
1839 ndev->priv_flags & IFF_802_1Q_VLAN ?
1840 vlan_dev_real_dev(ndev) : ndev,
1841 rt_tos2priority(id_priv->tos));
af7bd463 1842
3c86aa70
EC
1843 route->path_rec->mtu = iboe_get_mtu(ndev->mtu);
1844 route->path_rec->rate_selector = IB_SA_EQ;
1845 route->path_rec->rate = iboe_get_rate(ndev);
1846 dev_put(ndev);
1847 route->path_rec->packet_life_time_selector = IB_SA_EQ;
1848 route->path_rec->packet_life_time = CMA_IBOE_PACKET_LIFETIME;
1849 if (!route->path_rec->mtu) {
1850 ret = -EINVAL;
1851 goto err2;
1852 }
1853
550e5ca7
NM
1854 work->old_state = RDMA_CM_ROUTE_QUERY;
1855 work->new_state = RDMA_CM_ROUTE_RESOLVED;
3c86aa70
EC
1856 work->event.event = RDMA_CM_EVENT_ROUTE_RESOLVED;
1857 work->event.status = 0;
1858
1859 queue_work(cma_wq, &work->work);
1860
1861 return 0;
1862
1863err2:
1864 kfree(route->path_rec);
1865 route->path_rec = NULL;
1866err1:
1867 kfree(work);
1868 return ret;
1869}
1870
e51060f0
SH
1871int rdma_resolve_route(struct rdma_cm_id *id, int timeout_ms)
1872{
1873 struct rdma_id_private *id_priv;
1874 int ret;
1875
1876 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 1877 if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_RESOLVED, RDMA_CM_ROUTE_QUERY))
e51060f0
SH
1878 return -EINVAL;
1879
1880 atomic_inc(&id_priv->refcount);
07ebafba
TT
1881 switch (rdma_node_get_transport(id->device->node_type)) {
1882 case RDMA_TRANSPORT_IB:
3c86aa70
EC
1883 switch (rdma_port_get_link_layer(id->device, id->port_num)) {
1884 case IB_LINK_LAYER_INFINIBAND:
1885 ret = cma_resolve_ib_route(id_priv, timeout_ms);
1886 break;
1887 case IB_LINK_LAYER_ETHERNET:
1888 ret = cma_resolve_iboe_route(id_priv);
1889 break;
1890 default:
1891 ret = -ENOSYS;
1892 }
e51060f0 1893 break;
07ebafba
TT
1894 case RDMA_TRANSPORT_IWARP:
1895 ret = cma_resolve_iw_route(id_priv, timeout_ms);
1896 break;
e51060f0
SH
1897 default:
1898 ret = -ENOSYS;
1899 break;
1900 }
1901 if (ret)
1902 goto err;
1903
1904 return 0;
1905err:
550e5ca7 1906 cma_comp_exch(id_priv, RDMA_CM_ROUTE_QUERY, RDMA_CM_ADDR_RESOLVED);
e51060f0
SH
1907 cma_deref_id(id_priv);
1908 return ret;
1909}
1910EXPORT_SYMBOL(rdma_resolve_route);
1911
1912static int cma_bind_loopback(struct rdma_id_private *id_priv)
1913{
1914 struct cma_device *cma_dev;
1915 struct ib_port_attr port_attr;
f0ee3404 1916 union ib_gid gid;
e51060f0
SH
1917 u16 pkey;
1918 int ret;
1919 u8 p;
1920
1921 mutex_lock(&lock);
e82153b5
KK
1922 if (list_empty(&dev_list)) {
1923 ret = -ENODEV;
1924 goto out;
1925 }
e51060f0
SH
1926 list_for_each_entry(cma_dev, &dev_list, list)
1927 for (p = 1; p <= cma_dev->device->phys_port_cnt; ++p)
e82153b5 1928 if (!ib_query_port(cma_dev->device, p, &port_attr) &&
e51060f0
SH
1929 port_attr.state == IB_PORT_ACTIVE)
1930 goto port_found;
1931
e82153b5
KK
1932 p = 1;
1933 cma_dev = list_entry(dev_list.next, struct cma_device, list);
e51060f0
SH
1934
1935port_found:
f0ee3404 1936 ret = ib_get_cached_gid(cma_dev->device, p, 0, &gid);
e51060f0
SH
1937 if (ret)
1938 goto out;
1939
1940 ret = ib_get_cached_pkey(cma_dev->device, p, 0, &pkey);
1941 if (ret)
1942 goto out;
1943
6f8372b6 1944 id_priv->id.route.addr.dev_addr.dev_type =
3c86aa70 1945 (rdma_port_get_link_layer(cma_dev->device, p) == IB_LINK_LAYER_INFINIBAND) ?
6f8372b6
SH
1946 ARPHRD_INFINIBAND : ARPHRD_ETHER;
1947
1948 rdma_addr_set_sgid(&id_priv->id.route.addr.dev_addr, &gid);
e51060f0
SH
1949 ib_addr_set_pkey(&id_priv->id.route.addr.dev_addr, pkey);
1950 id_priv->id.port_num = p;
1951 cma_attach_to_dev(id_priv, cma_dev);
1952out:
1953 mutex_unlock(&lock);
1954 return ret;
1955}
1956
1957static void addr_handler(int status, struct sockaddr *src_addr,
1958 struct rdma_dev_addr *dev_addr, void *context)
1959{
1960 struct rdma_id_private *id_priv = context;
a1b1b61f 1961 struct rdma_cm_event event;
e51060f0 1962
a1b1b61f 1963 memset(&event, 0, sizeof event);
de910bd9 1964 mutex_lock(&id_priv->handler_mutex);
550e5ca7
NM
1965 if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_QUERY,
1966 RDMA_CM_ADDR_RESOLVED))
61a73c70 1967 goto out;
61a73c70
SH
1968
1969 if (!status && !id_priv->cma_dev)
e51060f0
SH
1970 status = cma_acquire_dev(id_priv);
1971
1972 if (status) {
550e5ca7
NM
1973 if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_RESOLVED,
1974 RDMA_CM_ADDR_BOUND))
e51060f0 1975 goto out;
a1b1b61f
SH
1976 event.event = RDMA_CM_EVENT_ADDR_ERROR;
1977 event.status = status;
e51060f0 1978 } else {
e51060f0
SH
1979 memcpy(&id_priv->id.route.addr.src_addr, src_addr,
1980 ip_addr_size(src_addr));
a1b1b61f 1981 event.event = RDMA_CM_EVENT_ADDR_RESOLVED;
e51060f0
SH
1982 }
1983
a1b1b61f 1984 if (id_priv->id.event_handler(&id_priv->id, &event)) {
550e5ca7 1985 cma_exch(id_priv, RDMA_CM_DESTROYING);
de910bd9 1986 mutex_unlock(&id_priv->handler_mutex);
e51060f0
SH
1987 cma_deref_id(id_priv);
1988 rdma_destroy_id(&id_priv->id);
1989 return;
1990 }
1991out:
de910bd9 1992 mutex_unlock(&id_priv->handler_mutex);
e51060f0
SH
1993 cma_deref_id(id_priv);
1994}
1995
1996static int cma_resolve_loopback(struct rdma_id_private *id_priv)
1997{
1998 struct cma_work *work;
6f8372b6 1999 struct sockaddr *src, *dst;
f0ee3404 2000 union ib_gid gid;
e51060f0
SH
2001 int ret;
2002
2003 work = kzalloc(sizeof *work, GFP_KERNEL);
2004 if (!work)
2005 return -ENOMEM;
2006
2007 if (!id_priv->cma_dev) {
2008 ret = cma_bind_loopback(id_priv);
2009 if (ret)
2010 goto err;
2011 }
2012
6f8372b6
SH
2013 rdma_addr_get_sgid(&id_priv->id.route.addr.dev_addr, &gid);
2014 rdma_addr_set_dgid(&id_priv->id.route.addr.dev_addr, &gid);
e51060f0 2015
6f8372b6
SH
2016 src = (struct sockaddr *) &id_priv->id.route.addr.src_addr;
2017 if (cma_zero_addr(src)) {
2018 dst = (struct sockaddr *) &id_priv->id.route.addr.dst_addr;
2019 if ((src->sa_family = dst->sa_family) == AF_INET) {
4e3fd7a0
AD
2020 ((struct sockaddr_in *)src)->sin_addr =
2021 ((struct sockaddr_in *)dst)->sin_addr;
6f8372b6 2022 } else {
4e3fd7a0
AD
2023 ((struct sockaddr_in6 *)src)->sin6_addr =
2024 ((struct sockaddr_in6 *)dst)->sin6_addr;
6f8372b6 2025 }
e51060f0
SH
2026 }
2027
2028 work->id = id_priv;
c4028958 2029 INIT_WORK(&work->work, cma_work_handler);
550e5ca7
NM
2030 work->old_state = RDMA_CM_ADDR_QUERY;
2031 work->new_state = RDMA_CM_ADDR_RESOLVED;
e51060f0
SH
2032 work->event.event = RDMA_CM_EVENT_ADDR_RESOLVED;
2033 queue_work(cma_wq, &work->work);
2034 return 0;
2035err:
2036 kfree(work);
2037 return ret;
2038}
2039
2040static int cma_bind_addr(struct rdma_cm_id *id, struct sockaddr *src_addr,
2041 struct sockaddr *dst_addr)
2042{
d14714df
SH
2043 if (!src_addr || !src_addr->sa_family) {
2044 src_addr = (struct sockaddr *) &id->route.addr.src_addr;
2045 if ((src_addr->sa_family = dst_addr->sa_family) == AF_INET6) {
2046 ((struct sockaddr_in6 *) src_addr)->sin6_scope_id =
2047 ((struct sockaddr_in6 *) dst_addr)->sin6_scope_id;
2048 }
2049 }
2050 return rdma_bind_addr(id, src_addr);
e51060f0
SH
2051}
2052
2053int rdma_resolve_addr(struct rdma_cm_id *id, struct sockaddr *src_addr,
2054 struct sockaddr *dst_addr, int timeout_ms)
2055{
2056 struct rdma_id_private *id_priv;
2057 int ret;
2058
2059 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 2060 if (id_priv->state == RDMA_CM_IDLE) {
e51060f0
SH
2061 ret = cma_bind_addr(id, src_addr, dst_addr);
2062 if (ret)
2063 return ret;
2064 }
2065
550e5ca7 2066 if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND, RDMA_CM_ADDR_QUERY))
e51060f0
SH
2067 return -EINVAL;
2068
2069 atomic_inc(&id_priv->refcount);
2070 memcpy(&id->route.addr.dst_addr, dst_addr, ip_addr_size(dst_addr));
2071 if (cma_any_addr(dst_addr))
2072 ret = cma_resolve_loopback(id_priv);
2073 else
3f446754 2074 ret = rdma_resolve_ip(&addr_client, (struct sockaddr *) &id->route.addr.src_addr,
7a118df3 2075 dst_addr, &id->route.addr.dev_addr,
e51060f0
SH
2076 timeout_ms, addr_handler, id_priv);
2077 if (ret)
2078 goto err;
2079
2080 return 0;
2081err:
550e5ca7 2082 cma_comp_exch(id_priv, RDMA_CM_ADDR_QUERY, RDMA_CM_ADDR_BOUND);
e51060f0
SH
2083 cma_deref_id(id_priv);
2084 return ret;
2085}
2086EXPORT_SYMBOL(rdma_resolve_addr);
2087
a9bb7912
HS
2088int rdma_set_reuseaddr(struct rdma_cm_id *id, int reuse)
2089{
2090 struct rdma_id_private *id_priv;
2091 unsigned long flags;
2092 int ret;
2093
2094 id_priv = container_of(id, struct rdma_id_private, id);
2095 spin_lock_irqsave(&id_priv->lock, flags);
550e5ca7 2096 if (id_priv->state == RDMA_CM_IDLE) {
a9bb7912
HS
2097 id_priv->reuseaddr = reuse;
2098 ret = 0;
2099 } else {
2100 ret = -EINVAL;
2101 }
2102 spin_unlock_irqrestore(&id_priv->lock, flags);
2103 return ret;
2104}
2105EXPORT_SYMBOL(rdma_set_reuseaddr);
2106
e51060f0
SH
2107static void cma_bind_port(struct rdma_bind_list *bind_list,
2108 struct rdma_id_private *id_priv)
2109{
2110 struct sockaddr_in *sin;
2111
2112 sin = (struct sockaddr_in *) &id_priv->id.route.addr.src_addr;
2113 sin->sin_port = htons(bind_list->port);
2114 id_priv->bind_list = bind_list;
2115 hlist_add_head(&id_priv->node, &bind_list->owners);
2116}
2117
2118static int cma_alloc_port(struct idr *ps, struct rdma_id_private *id_priv,
2119 unsigned short snum)
2120{
2121 struct rdma_bind_list *bind_list;
aedec080 2122 int port, ret;
e51060f0 2123
cb164b8c 2124 bind_list = kzalloc(sizeof *bind_list, GFP_KERNEL);
e51060f0
SH
2125 if (!bind_list)
2126 return -ENOMEM;
2127
aedec080
SH
2128 do {
2129 ret = idr_get_new_above(ps, bind_list, snum, &port);
2130 } while ((ret == -EAGAIN) && idr_pre_get(ps, GFP_KERNEL));
2131
2132 if (ret)
2133 goto err1;
2134
2135 if (port != snum) {
2136 ret = -EADDRNOTAVAIL;
2137 goto err2;
2138 }
2139
2140 bind_list->ps = ps;
2141 bind_list->port = (unsigned short) port;
2142 cma_bind_port(bind_list, id_priv);
2143 return 0;
2144err2:
2145 idr_remove(ps, port);
2146err1:
2147 kfree(bind_list);
2148 return ret;
2149}
e51060f0 2150
aedec080
SH
2151static int cma_alloc_any_port(struct idr *ps, struct rdma_id_private *id_priv)
2152{
5d7220e8
TH
2153 static unsigned int last_used_port;
2154 int low, high, remaining;
2155 unsigned int rover;
e51060f0 2156
227b60f5 2157 inet_get_local_port_range(&low, &high);
5d7220e8
TH
2158 remaining = (high - low) + 1;
2159 rover = net_random() % remaining + low;
2160retry:
2161 if (last_used_port != rover &&
2162 !idr_find(ps, (unsigned short) rover)) {
2163 int ret = cma_alloc_port(ps, id_priv, rover);
2164 /*
2165 * Remember previously used port number in order to avoid
2166 * re-using same port immediately after it is closed.
2167 */
2168 if (!ret)
2169 last_used_port = rover;
2170 if (ret != -EADDRNOTAVAIL)
2171 return ret;
e51060f0 2172 }
5d7220e8
TH
2173 if (--remaining) {
2174 rover++;
2175 if ((rover < low) || (rover > high))
2176 rover = low;
2177 goto retry;
2178 }
2179 return -EADDRNOTAVAIL;
e51060f0
SH
2180}
2181
a9bb7912
HS
2182/*
2183 * Check that the requested port is available. This is called when trying to
2184 * bind to a specific port, or when trying to listen on a bound port. In
2185 * the latter case, the provided id_priv may already be on the bind_list, but
2186 * we still need to check that it's okay to start listening.
2187 */
2188static int cma_check_port(struct rdma_bind_list *bind_list,
2189 struct rdma_id_private *id_priv, uint8_t reuseaddr)
e51060f0
SH
2190{
2191 struct rdma_id_private *cur_id;
43b752da 2192 struct sockaddr *addr, *cur_addr;
e51060f0 2193 struct hlist_node *node;
e51060f0 2194
43b752da 2195 addr = (struct sockaddr *) &id_priv->id.route.addr.src_addr;
e51060f0 2196 hlist_for_each_entry(cur_id, node, &bind_list->owners, node) {
a9bb7912
HS
2197 if (id_priv == cur_id)
2198 continue;
3cd96564 2199
5b0ec991
SH
2200 if ((cur_id->state != RDMA_CM_LISTEN) && reuseaddr &&
2201 cur_id->reuseaddr)
2202 continue;
e51060f0 2203
5b0ec991
SH
2204 cur_addr = (struct sockaddr *) &cur_id->id.route.addr.src_addr;
2205 if (id_priv->afonly && cur_id->afonly &&
2206 (addr->sa_family != cur_addr->sa_family))
2207 continue;
2208
2209 if (cma_any_addr(addr) || cma_any_addr(cur_addr))
2210 return -EADDRNOTAVAIL;
2211
2212 if (!cma_addr_cmp(addr, cur_addr))
2213 return -EADDRINUSE;
a9bb7912 2214 }
e51060f0
SH
2215 return 0;
2216}
2217
a9bb7912
HS
2218static int cma_use_port(struct idr *ps, struct rdma_id_private *id_priv)
2219{
2220 struct rdma_bind_list *bind_list;
2221 unsigned short snum;
2222 int ret;
2223
2224 snum = ntohs(cma_port((struct sockaddr *) &id_priv->id.route.addr.src_addr));
2225 if (snum < PROT_SOCK && !capable(CAP_NET_BIND_SERVICE))
2226 return -EACCES;
2227
2228 bind_list = idr_find(ps, snum);
2229 if (!bind_list) {
2230 ret = cma_alloc_port(ps, id_priv, snum);
2231 } else {
2232 ret = cma_check_port(bind_list, id_priv, id_priv->reuseaddr);
2233 if (!ret)
2234 cma_bind_port(bind_list, id_priv);
2235 }
2236 return ret;
2237}
2238
2239static int cma_bind_listen(struct rdma_id_private *id_priv)
2240{
2241 struct rdma_bind_list *bind_list = id_priv->bind_list;
2242 int ret = 0;
2243
2244 mutex_lock(&lock);
2245 if (bind_list->owners.first->next)
2246 ret = cma_check_port(bind_list, id_priv, 0);
2247 mutex_unlock(&lock);
2248 return ret;
2249}
2250
e51060f0
SH
2251static int cma_get_port(struct rdma_id_private *id_priv)
2252{
2253 struct idr *ps;
2254 int ret;
2255
2256 switch (id_priv->id.ps) {
2257 case RDMA_PS_SDP:
2258 ps = &sdp_ps;
2259 break;
2260 case RDMA_PS_TCP:
2261 ps = &tcp_ps;
2262 break;
628e5f6d
SH
2263 case RDMA_PS_UDP:
2264 ps = &udp_ps;
2265 break;
c8f6a362
SH
2266 case RDMA_PS_IPOIB:
2267 ps = &ipoib_ps;
2268 break;
2d2e9415
SH
2269 case RDMA_PS_IB:
2270 ps = &ib_ps;
2271 break;
e51060f0
SH
2272 default:
2273 return -EPROTONOSUPPORT;
2274 }
2275
2276 mutex_lock(&lock);
3f446754 2277 if (cma_any_port((struct sockaddr *) &id_priv->id.route.addr.src_addr))
aedec080 2278 ret = cma_alloc_any_port(ps, id_priv);
e51060f0
SH
2279 else
2280 ret = cma_use_port(ps, id_priv);
2281 mutex_unlock(&lock);
2282
2283 return ret;
2284}
2285
d14714df
SH
/*
 * For AF_INET6 addresses (when IPv6 support is configured): reject a
 * link-local address that carries no scope id, otherwise record the scope
 * id as the device address's bound interface.  Other families are ignored.
 *
 * Returns 0, or -EINVAL for a link-local address without a scope id.
 */
static int cma_check_linklocal(struct rdma_dev_addr *dev_addr,
			       struct sockaddr *addr)
{
#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
	if (addr->sa_family == AF_INET6) {
		struct sockaddr_in6 *in6 = (struct sockaddr_in6 *) addr;

		if ((ipv6_addr_type(&in6->sin6_addr) & IPV6_ADDR_LINKLOCAL) &&
		    !in6->sin6_scope_id)
			return -EINVAL;

		dev_addr->bound_dev_if = in6->sin6_scope_id;
	}
#endif
	return 0;
}
2304
a9bb7912
HS
2305int rdma_listen(struct rdma_cm_id *id, int backlog)
2306{
2307 struct rdma_id_private *id_priv;
2308 int ret;
2309
2310 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 2311 if (id_priv->state == RDMA_CM_IDLE) {
a9bb7912
HS
2312 ((struct sockaddr *) &id->route.addr.src_addr)->sa_family = AF_INET;
2313 ret = rdma_bind_addr(id, (struct sockaddr *) &id->route.addr.src_addr);
2314 if (ret)
2315 return ret;
2316 }
2317
550e5ca7 2318 if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND, RDMA_CM_LISTEN))
a9bb7912
HS
2319 return -EINVAL;
2320
2321 if (id_priv->reuseaddr) {
2322 ret = cma_bind_listen(id_priv);
2323 if (ret)
2324 goto err;
2325 }
2326
2327 id_priv->backlog = backlog;
2328 if (id->device) {
2329 switch (rdma_node_get_transport(id->device->node_type)) {
2330 case RDMA_TRANSPORT_IB:
2331 ret = cma_ib_listen(id_priv);
2332 if (ret)
2333 goto err;
2334 break;
2335 case RDMA_TRANSPORT_IWARP:
2336 ret = cma_iw_listen(id_priv, backlog);
2337 if (ret)
2338 goto err;
2339 break;
2340 default:
2341 ret = -ENOSYS;
2342 goto err;
2343 }
2344 } else
2345 cma_listen_on_all(id_priv);
2346
2347 return 0;
2348err:
2349 id_priv->backlog = 0;
550e5ca7 2350 cma_comp_exch(id_priv, RDMA_CM_LISTEN, RDMA_CM_ADDR_BOUND);
a9bb7912
HS
2351 return ret;
2352}
2353EXPORT_SYMBOL(rdma_listen);
2354
e51060f0
SH
2355int rdma_bind_addr(struct rdma_cm_id *id, struct sockaddr *addr)
2356{
2357 struct rdma_id_private *id_priv;
2358 int ret;
2359
1f5175ad 2360 if (addr->sa_family != AF_INET && addr->sa_family != AF_INET6)
e51060f0
SH
2361 return -EAFNOSUPPORT;
2362
2363 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 2364 if (!cma_comp_exch(id_priv, RDMA_CM_IDLE, RDMA_CM_ADDR_BOUND))
e51060f0
SH
2365 return -EINVAL;
2366
d14714df
SH
2367 ret = cma_check_linklocal(&id->route.addr.dev_addr, addr);
2368 if (ret)
2369 goto err1;
2370
8523c048 2371 if (!cma_any_addr(addr)) {
e51060f0 2372 ret = rdma_translate_ip(addr, &id->route.addr.dev_addr);
e51060f0 2373 if (ret)
255d0c14
KK
2374 goto err1;
2375
255d0c14 2376 ret = cma_acquire_dev(id_priv);
255d0c14
KK
2377 if (ret)
2378 goto err1;
e51060f0
SH
2379 }
2380
2381 memcpy(&id->route.addr.src_addr, addr, ip_addr_size(addr));
5b0ec991
SH
2382 if (addr->sa_family == AF_INET)
2383 id_priv->afonly = 1;
2384#if IS_ENABLED(CONFIG_IPV6)
2385 else if (addr->sa_family == AF_INET6)
2386 id_priv->afonly = init_net.ipv6.sysctl.bindv6only;
2387#endif
e51060f0
SH
2388 ret = cma_get_port(id_priv);
2389 if (ret)
255d0c14 2390 goto err2;
e51060f0
SH
2391
2392 return 0;
255d0c14 2393err2:
a396d43a
SH
2394 if (id_priv->cma_dev)
2395 cma_release_dev(id_priv);
255d0c14 2396err1:
550e5ca7 2397 cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND, RDMA_CM_IDLE);
e51060f0
SH
2398 return ret;
2399}
2400EXPORT_SYMBOL(rdma_bind_addr);
2401
2402static int cma_format_hdr(void *hdr, enum rdma_port_space ps,
2403 struct rdma_route *route)
2404{
e51060f0
SH
2405 struct cma_hdr *cma_hdr;
2406 struct sdp_hh *sdp_hdr;
2407
1f5175ad
AS
2408 if (route->addr.src_addr.ss_family == AF_INET) {
2409 struct sockaddr_in *src4, *dst4;
2410
2411 src4 = (struct sockaddr_in *) &route->addr.src_addr;
2412 dst4 = (struct sockaddr_in *) &route->addr.dst_addr;
2413
2414 switch (ps) {
2415 case RDMA_PS_SDP:
2416 sdp_hdr = hdr;
2417 if (sdp_get_majv(sdp_hdr->sdp_version) != SDP_MAJ_VERSION)
2418 return -EINVAL;
2419 sdp_set_ip_ver(sdp_hdr, 4);
2420 sdp_hdr->src_addr.ip4.addr = src4->sin_addr.s_addr;
2421 sdp_hdr->dst_addr.ip4.addr = dst4->sin_addr.s_addr;
2422 sdp_hdr->port = src4->sin_port;
2423 break;
2424 default:
2425 cma_hdr = hdr;
2426 cma_hdr->cma_version = CMA_VERSION;
2427 cma_set_ip_ver(cma_hdr, 4);
2428 cma_hdr->src_addr.ip4.addr = src4->sin_addr.s_addr;
2429 cma_hdr->dst_addr.ip4.addr = dst4->sin_addr.s_addr;
2430 cma_hdr->port = src4->sin_port;
2431 break;
2432 }
2433 } else {
2434 struct sockaddr_in6 *src6, *dst6;
2435
2436 src6 = (struct sockaddr_in6 *) &route->addr.src_addr;
2437 dst6 = (struct sockaddr_in6 *) &route->addr.dst_addr;
2438
2439 switch (ps) {
2440 case RDMA_PS_SDP:
2441 sdp_hdr = hdr;
2442 if (sdp_get_majv(sdp_hdr->sdp_version) != SDP_MAJ_VERSION)
2443 return -EINVAL;
2444 sdp_set_ip_ver(sdp_hdr, 6);
2445 sdp_hdr->src_addr.ip6 = src6->sin6_addr;
2446 sdp_hdr->dst_addr.ip6 = dst6->sin6_addr;
2447 sdp_hdr->port = src6->sin6_port;
2448 break;
2449 default:
2450 cma_hdr = hdr;
2451 cma_hdr->cma_version = CMA_VERSION;
2452 cma_set_ip_ver(cma_hdr, 6);
2453 cma_hdr->src_addr.ip6 = src6->sin6_addr;
2454 cma_hdr->dst_addr.ip6 = dst6->sin6_addr;
2455 cma_hdr->port = src6->sin6_port;
2456 break;
2457 }
e51060f0
SH
2458 }
2459 return 0;
2460}
2461
628e5f6d
SH
2462static int cma_sidr_rep_handler(struct ib_cm_id *cm_id,
2463 struct ib_cm_event *ib_event)
2464{
2465 struct rdma_id_private *id_priv = cm_id->context;
2466 struct rdma_cm_event event;
2467 struct ib_cm_sidr_rep_event_param *rep = &ib_event->param.sidr_rep_rcvd;
2468 int ret = 0;
2469
550e5ca7 2470 if (cma_disable_callback(id_priv, RDMA_CM_CONNECT))
8aa08602 2471 return 0;
628e5f6d 2472
8aa08602 2473 memset(&event, 0, sizeof event);
628e5f6d
SH
2474 switch (ib_event->event) {
2475 case IB_CM_SIDR_REQ_ERROR:
2476 event.event = RDMA_CM_EVENT_UNREACHABLE;
2477 event.status = -ETIMEDOUT;
2478 break;
2479 case IB_CM_SIDR_REP_RECEIVED:
2480 event.param.ud.private_data = ib_event->private_data;
2481 event.param.ud.private_data_len = IB_CM_SIDR_REP_PRIVATE_DATA_SIZE;
2482 if (rep->status != IB_SIDR_SUCCESS) {
2483 event.event = RDMA_CM_EVENT_UNREACHABLE;
2484 event.status = ib_event->param.sidr_rep_rcvd.status;
2485 break;
2486 }
d2ca39f2
YE
2487 ret = cma_set_qkey(id_priv);
2488 if (ret) {
2489 event.event = RDMA_CM_EVENT_ADDR_ERROR;
2490 event.status = -EINVAL;
2491 break;
2492 }
c8f6a362 2493 if (id_priv->qkey != rep->qkey) {
628e5f6d
SH
2494 event.event = RDMA_CM_EVENT_UNREACHABLE;
2495 event.status = -EINVAL;
2496 break;
2497 }
2498 ib_init_ah_from_path(id_priv->id.device, id_priv->id.port_num,
2499 id_priv->id.route.path_rec,
2500 &event.param.ud.ah_attr);
2501 event.param.ud.qp_num = rep->qpn;
2502 event.param.ud.qkey = rep->qkey;
2503 event.event = RDMA_CM_EVENT_ESTABLISHED;
2504 event.status = 0;
2505 break;
2506 default:
468f2239 2507 printk(KERN_ERR "RDMA CMA: unexpected IB CM event: %d\n",
628e5f6d
SH
2508 ib_event->event);
2509 goto out;
2510 }
2511
2512 ret = id_priv->id.event_handler(&id_priv->id, &event);
2513 if (ret) {
2514 /* Destroy the CM ID by returning a non-zero value. */
2515 id_priv->cm_id.ib = NULL;
550e5ca7 2516 cma_exch(id_priv, RDMA_CM_DESTROYING);
de910bd9 2517 mutex_unlock(&id_priv->handler_mutex);
628e5f6d
SH
2518 rdma_destroy_id(&id_priv->id);
2519 return ret;
2520 }
2521out:
de910bd9 2522 mutex_unlock(&id_priv->handler_mutex);
628e5f6d
SH
2523 return ret;
2524}
2525
2526static int cma_resolve_ib_udp(struct rdma_id_private *id_priv,
2527 struct rdma_conn_param *conn_param)
2528{
2529 struct ib_cm_sidr_req_param req;
2530 struct rdma_route *route;
0c9361fc 2531 struct ib_cm_id *id;
628e5f6d
SH
2532 int ret;
2533
2534 req.private_data_len = sizeof(struct cma_hdr) +
2535 conn_param->private_data_len;
04ded167
SH
2536 if (req.private_data_len < conn_param->private_data_len)
2537 return -EINVAL;
2538
628e5f6d
SH
2539 req.private_data = kzalloc(req.private_data_len, GFP_ATOMIC);
2540 if (!req.private_data)
2541 return -ENOMEM;
2542
2543 if (conn_param->private_data && conn_param->private_data_len)
2544 memcpy((void *) req.private_data + sizeof(struct cma_hdr),
2545 conn_param->private_data, conn_param->private_data_len);
2546
2547 route = &id_priv->id.route;
2548 ret = cma_format_hdr((void *) req.private_data, id_priv->id.ps, route);
2549 if (ret)
2550 goto out;
2551
0c9361fc
JM
2552 id = ib_create_cm_id(id_priv->id.device, cma_sidr_rep_handler,
2553 id_priv);
2554 if (IS_ERR(id)) {
2555 ret = PTR_ERR(id);
628e5f6d
SH
2556 goto out;
2557 }
0c9361fc 2558 id_priv->cm_id.ib = id;
628e5f6d
SH
2559
2560 req.path = route->path_rec;
2561 req.service_id = cma_get_service_id(id_priv->id.ps,
3f446754 2562 (struct sockaddr *) &route->addr.dst_addr);
628e5f6d
SH
2563 req.timeout_ms = 1 << (CMA_CM_RESPONSE_TIMEOUT - 8);
2564 req.max_cm_retries = CMA_MAX_CM_RETRIES;
2565
2566 ret = ib_send_cm_sidr_req(id_priv->cm_id.ib, &req);
2567 if (ret) {
2568 ib_destroy_cm_id(id_priv->cm_id.ib);
2569 id_priv->cm_id.ib = NULL;
2570 }
2571out:
2572 kfree(req.private_data);
2573 return ret;
2574}
2575
e51060f0
SH
2576static int cma_connect_ib(struct rdma_id_private *id_priv,
2577 struct rdma_conn_param *conn_param)
2578{
2579 struct ib_cm_req_param req;
2580 struct rdma_route *route;
2581 void *private_data;
0c9361fc 2582 struct ib_cm_id *id;
e51060f0
SH
2583 int offset, ret;
2584
2585 memset(&req, 0, sizeof req);
2586 offset = cma_user_data_offset(id_priv->id.ps);
2587 req.private_data_len = offset + conn_param->private_data_len;
04ded167
SH
2588 if (req.private_data_len < conn_param->private_data_len)
2589 return -EINVAL;
2590
e51060f0
SH
2591 private_data = kzalloc(req.private_data_len, GFP_ATOMIC);
2592 if (!private_data)
2593 return -ENOMEM;
2594
2595 if (conn_param->private_data && conn_param->private_data_len)
2596 memcpy(private_data + offset, conn_param->private_data,
2597 conn_param->private_data_len);
2598
0c9361fc
JM
2599 id = ib_create_cm_id(id_priv->id.device, cma_ib_handler, id_priv);
2600 if (IS_ERR(id)) {
2601 ret = PTR_ERR(id);
e51060f0
SH
2602 goto out;
2603 }
0c9361fc 2604 id_priv->cm_id.ib = id;
e51060f0
SH
2605
2606 route = &id_priv->id.route;
2607 ret = cma_format_hdr(private_data, id_priv->id.ps, route);
2608 if (ret)
2609 goto out;
2610 req.private_data = private_data;
2611
2612 req.primary_path = &route->path_rec[0];
2613 if (route->num_paths == 2)
2614 req.alternate_path = &route->path_rec[1];
2615
2616 req.service_id = cma_get_service_id(id_priv->id.ps,
3f446754 2617 (struct sockaddr *) &route->addr.dst_addr);
e51060f0 2618 req.qp_num = id_priv->qp_num;
18c441a6 2619 req.qp_type = id_priv->id.qp_type;
e51060f0
SH
2620 req.starting_psn = id_priv->seq_num;
2621 req.responder_resources = conn_param->responder_resources;
2622 req.initiator_depth = conn_param->initiator_depth;
2623 req.flow_control = conn_param->flow_control;
2624 req.retry_count = conn_param->retry_count;
2625 req.rnr_retry_count = conn_param->rnr_retry_count;
2626 req.remote_cm_response_timeout = CMA_CM_RESPONSE_TIMEOUT;
2627 req.local_cm_response_timeout = CMA_CM_RESPONSE_TIMEOUT;
2628 req.max_cm_retries = CMA_MAX_CM_RETRIES;
2629 req.srq = id_priv->srq ? 1 : 0;
2630
2631 ret = ib_send_cm_req(id_priv->cm_id.ib, &req);
2632out:
0c9361fc
JM
2633 if (ret && !IS_ERR(id)) {
2634 ib_destroy_cm_id(id);
675a027c
KK
2635 id_priv->cm_id.ib = NULL;
2636 }
2637
e51060f0
SH
2638 kfree(private_data);
2639 return ret;
2640}
2641
07ebafba
TT
2642static int cma_connect_iw(struct rdma_id_private *id_priv,
2643 struct rdma_conn_param *conn_param)
2644{
2645 struct iw_cm_id *cm_id;
2646 struct sockaddr_in* sin;
2647 int ret;
2648 struct iw_cm_conn_param iw_param;
2649
2650 cm_id = iw_create_cm_id(id_priv->id.device, cma_iw_handler, id_priv);
0c9361fc
JM
2651 if (IS_ERR(cm_id))
2652 return PTR_ERR(cm_id);
07ebafba
TT
2653
2654 id_priv->cm_id.iw = cm_id;
2655
2656 sin = (struct sockaddr_in*) &id_priv->id.route.addr.src_addr;
2657 cm_id->local_addr = *sin;
2658
2659 sin = (struct sockaddr_in*) &id_priv->id.route.addr.dst_addr;
2660 cm_id->remote_addr = *sin;
2661
5851bb89 2662 ret = cma_modify_qp_rtr(id_priv, conn_param);
675a027c
KK
2663 if (ret)
2664 goto out;
07ebafba 2665
f45ee80e
HS
2666 if (conn_param) {
2667 iw_param.ord = conn_param->initiator_depth;
2668 iw_param.ird = conn_param->responder_resources;
2669 iw_param.private_data = conn_param->private_data;
2670 iw_param.private_data_len = conn_param->private_data_len;
2671 iw_param.qpn = id_priv->id.qp ? id_priv->qp_num : conn_param->qp_num;
2672 } else {
2673 memset(&iw_param, 0, sizeof iw_param);
07ebafba 2674 iw_param.qpn = id_priv->qp_num;
f45ee80e 2675 }
07ebafba
TT
2676 ret = iw_cm_connect(cm_id, &iw_param);
2677out:
0c9361fc 2678 if (ret) {
675a027c
KK
2679 iw_destroy_cm_id(cm_id);
2680 id_priv->cm_id.iw = NULL;
2681 }
07ebafba
TT
2682 return ret;
2683}
2684
e51060f0
SH
2685int rdma_connect(struct rdma_cm_id *id, struct rdma_conn_param *conn_param)
2686{
2687 struct rdma_id_private *id_priv;
2688 int ret;
2689
2690 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7 2691 if (!cma_comp_exch(id_priv, RDMA_CM_ROUTE_RESOLVED, RDMA_CM_CONNECT))
e51060f0
SH
2692 return -EINVAL;
2693
2694 if (!id->qp) {
2695 id_priv->qp_num = conn_param->qp_num;
e51060f0
SH
2696 id_priv->srq = conn_param->srq;
2697 }
2698
07ebafba
TT
2699 switch (rdma_node_get_transport(id->device->node_type)) {
2700 case RDMA_TRANSPORT_IB:
b26f9b99 2701 if (id->qp_type == IB_QPT_UD)
628e5f6d
SH
2702 ret = cma_resolve_ib_udp(id_priv, conn_param);
2703 else
2704 ret = cma_connect_ib(id_priv, conn_param);
e51060f0 2705 break;
07ebafba
TT
2706 case RDMA_TRANSPORT_IWARP:
2707 ret = cma_connect_iw(id_priv, conn_param);
2708 break;
e51060f0
SH
2709 default:
2710 ret = -ENOSYS;
2711 break;
2712 }
2713 if (ret)
2714 goto err;
2715
2716 return 0;
2717err:
550e5ca7 2718 cma_comp_exch(id_priv, RDMA_CM_CONNECT, RDMA_CM_ROUTE_RESOLVED);
e51060f0
SH
2719 return ret;
2720}
2721EXPORT_SYMBOL(rdma_connect);
2722
2723static int cma_accept_ib(struct rdma_id_private *id_priv,
2724 struct rdma_conn_param *conn_param)
2725{
2726 struct ib_cm_rep_param rep;
5851bb89 2727 int ret;
0fe313b0 2728
5851bb89
SH
2729 ret = cma_modify_qp_rtr(id_priv, conn_param);
2730 if (ret)
2731 goto out;
0fe313b0 2732
5851bb89
SH
2733 ret = cma_modify_qp_rts(id_priv, conn_param);
2734 if (ret)
2735 goto out;
e51060f0
SH
2736
2737 memset(&rep, 0, sizeof rep);
2738 rep.qp_num = id_priv->qp_num;
2739 rep.starting_psn = id_priv->seq_num;
2740 rep.private_data = conn_param->private_data;
2741 rep.private_data_len = conn_param->private_data_len;
2742 rep.responder_resources = conn_param->responder_resources;
2743 rep.initiator_depth = conn_param->initiator_depth;
e51060f0
SH
2744 rep.failover_accepted = 0;
2745 rep.flow_control = conn_param->flow_control;
2746 rep.rnr_retry_count = conn_param->rnr_retry_count;
2747 rep.srq = id_priv->srq ? 1 : 0;
2748
0fe313b0
SH
2749 ret = ib_send_cm_rep(id_priv->cm_id.ib, &rep);
2750out:
2751 return ret;
e51060f0
SH
2752}
2753
07ebafba
TT
2754static int cma_accept_iw(struct rdma_id_private *id_priv,
2755 struct rdma_conn_param *conn_param)
2756{
2757 struct iw_cm_conn_param iw_param;
2758 int ret;
2759
5851bb89 2760 ret = cma_modify_qp_rtr(id_priv, conn_param);
07ebafba
TT
2761 if (ret)
2762 return ret;
2763
2764 iw_param.ord = conn_param->initiator_depth;
2765 iw_param.ird = conn_param->responder_resources;
2766 iw_param.private_data = conn_param->private_data;
2767 iw_param.private_data_len = conn_param->private_data_len;
2768 if (id_priv->id.qp) {
2769 iw_param.qpn = id_priv->qp_num;
2770 } else
2771 iw_param.qpn = conn_param->qp_num;
2772
2773 return iw_cm_accept(id_priv->cm_id.iw, &iw_param);
2774}
2775
628e5f6d
SH
2776static int cma_send_sidr_rep(struct rdma_id_private *id_priv,
2777 enum ib_cm_sidr_status status,
2778 const void *private_data, int private_data_len)
2779{
2780 struct ib_cm_sidr_rep_param rep;
d2ca39f2 2781 int ret;
628e5f6d
SH
2782
2783 memset(&rep, 0, sizeof rep);
2784 rep.status = status;
2785 if (status == IB_SIDR_SUCCESS) {
d2ca39f2
YE
2786 ret = cma_set_qkey(id_priv);
2787 if (ret)
2788 return ret;
628e5f6d 2789 rep.qp_num = id_priv->qp_num;
c8f6a362 2790 rep.qkey = id_priv->qkey;
628e5f6d
SH
2791 }
2792 rep.private_data = private_data;
2793 rep.private_data_len = private_data_len;
2794
2795 return ib_send_cm_sidr_rep(id_priv->cm_id.ib, &rep);
2796}
2797
e51060f0
SH
2798int rdma_accept(struct rdma_cm_id *id, struct rdma_conn_param *conn_param)
2799{
2800 struct rdma_id_private *id_priv;
2801 int ret;
2802
2803 id_priv = container_of(id, struct rdma_id_private, id);
83e9502d
NM
2804
2805 id_priv->owner = task_pid_nr(current);
2806
550e5ca7 2807 if (!cma_comp(id_priv, RDMA_CM_CONNECT))
e51060f0
SH
2808 return -EINVAL;
2809
2810 if (!id->qp && conn_param) {
2811 id_priv->qp_num = conn_param->qp_num;
e51060f0
SH
2812 id_priv->srq = conn_param->srq;
2813 }
2814
07ebafba
TT
2815 switch (rdma_node_get_transport(id->device->node_type)) {
2816 case RDMA_TRANSPORT_IB:
f45ee80e
HS
2817 if (id->qp_type == IB_QPT_UD) {
2818 if (conn_param)
2819 ret = cma_send_sidr_rep(id_priv, IB_SIDR_SUCCESS,
2820 conn_param->private_data,
2821 conn_param->private_data_len);
2822 else
2823 ret = cma_send_sidr_rep(id_priv, IB_SIDR_SUCCESS,
2824 NULL, 0);
2825 } else {
2826 if (conn_param)
2827 ret = cma_accept_ib(id_priv, conn_param);
2828 else
2829 ret = cma_rep_recv(id_priv);
2830 }
e51060f0 2831 break;
07ebafba
TT
2832 case RDMA_TRANSPORT_IWARP:
2833 ret = cma_accept_iw(id_priv, conn_param);
2834 break;
e51060f0
SH
2835 default:
2836 ret = -ENOSYS;
2837 break;
2838 }
2839
2840 if (ret)
2841 goto reject;
2842
2843 return 0;
2844reject:
c5483388 2845 cma_modify_qp_err(id_priv);
e51060f0
SH
2846 rdma_reject(id, NULL, 0);
2847 return ret;
2848}
2849EXPORT_SYMBOL(rdma_accept);
2850
0fe313b0
SH
2851int rdma_notify(struct rdma_cm_id *id, enum ib_event_type event)
2852{
2853 struct rdma_id_private *id_priv;
2854 int ret;
2855
2856 id_priv = container_of(id, struct rdma_id_private, id);
0c9361fc 2857 if (!id_priv->cm_id.ib)
0fe313b0
SH
2858 return -EINVAL;
2859
2860 switch (id->device->node_type) {
2861 case RDMA_NODE_IB_CA:
2862 ret = ib_cm_notify(id_priv->cm_id.ib, event);
2863 break;
2864 default:
2865 ret = 0;
2866 break;
2867 }
2868 return ret;
2869}
2870EXPORT_SYMBOL(rdma_notify);
2871
e51060f0
SH
2872int rdma_reject(struct rdma_cm_id *id, const void *private_data,
2873 u8 private_data_len)
2874{
2875 struct rdma_id_private *id_priv;
2876 int ret;
2877
2878 id_priv = container_of(id, struct rdma_id_private, id);
0c9361fc 2879 if (!id_priv->cm_id.ib)
e51060f0
SH
2880 return -EINVAL;
2881
07ebafba
TT
2882 switch (rdma_node_get_transport(id->device->node_type)) {
2883 case RDMA_TRANSPORT_IB:
b26f9b99 2884 if (id->qp_type == IB_QPT_UD)
628e5f6d
SH
2885 ret = cma_send_sidr_rep(id_priv, IB_SIDR_REJECT,
2886 private_data, private_data_len);
2887 else
2888 ret = ib_send_cm_rej(id_priv->cm_id.ib,
2889 IB_CM_REJ_CONSUMER_DEFINED, NULL,
2890 0, private_data, private_data_len);
e51060f0 2891 break;
07ebafba
TT
2892 case RDMA_TRANSPORT_IWARP:
2893 ret = iw_cm_reject(id_priv->cm_id.iw,
2894 private_data, private_data_len);
2895 break;
e51060f0
SH
2896 default:
2897 ret = -ENOSYS;
2898 break;
2899 }
2900 return ret;
2901}
2902EXPORT_SYMBOL(rdma_reject);
2903
2904int rdma_disconnect(struct rdma_cm_id *id)
2905{
2906 struct rdma_id_private *id_priv;
2907 int ret;
2908
2909 id_priv = container_of(id, struct rdma_id_private, id);
0c9361fc 2910 if (!id_priv->cm_id.ib)
e51060f0
SH
2911 return -EINVAL;
2912
07ebafba
TT
2913 switch (rdma_node_get_transport(id->device->node_type)) {
2914 case RDMA_TRANSPORT_IB:
c5483388 2915 ret = cma_modify_qp_err(id_priv);
07ebafba
TT
2916 if (ret)
2917 goto out;
e51060f0
SH
2918 /* Initiate or respond to a disconnect. */
2919 if (ib_send_cm_dreq(id_priv->cm_id.ib, NULL, 0))
2920 ib_send_cm_drep(id_priv->cm_id.ib, NULL, 0);
2921 break;
07ebafba
TT
2922 case RDMA_TRANSPORT_IWARP:
2923 ret = iw_cm_disconnect(id_priv->cm_id.iw, 0);
2924 break;
e51060f0 2925 default:
07ebafba 2926 ret = -EINVAL;
e51060f0
SH
2927 break;
2928 }
2929out:
2930 return ret;
2931}
2932EXPORT_SYMBOL(rdma_disconnect);
2933
c8f6a362
SH
2934static int cma_ib_mc_handler(int status, struct ib_sa_multicast *multicast)
2935{
2936 struct rdma_id_private *id_priv;
2937 struct cma_multicast *mc = multicast->context;
2938 struct rdma_cm_event event;
2939 int ret;
2940
2941 id_priv = mc->id_priv;
550e5ca7
NM
2942 if (cma_disable_callback(id_priv, RDMA_CM_ADDR_BOUND) &&
2943 cma_disable_callback(id_priv, RDMA_CM_ADDR_RESOLVED))
8aa08602 2944 return 0;
c8f6a362 2945
c5483388 2946 mutex_lock(&id_priv->qp_mutex);
c8f6a362
SH
2947 if (!status && id_priv->id.qp)
2948 status = ib_attach_mcast(id_priv->id.qp, &multicast->rec.mgid,
46ea5061 2949 be16_to_cpu(multicast->rec.mlid));
c5483388 2950 mutex_unlock(&id_priv->qp_mutex);
c8f6a362
SH
2951
2952 memset(&event, 0, sizeof event);
2953 event.status = status;
2954 event.param.ud.private_data = mc->context;
2955 if (!status) {
2956 event.event = RDMA_CM_EVENT_MULTICAST_JOIN;
2957 ib_init_ah_from_mcmember(id_priv->id.device,
2958 id_priv->id.port_num, &multicast->rec,
2959 &event.param.ud.ah_attr);
2960 event.param.ud.qp_num = 0xFFFFFF;
2961 event.param.ud.qkey = be32_to_cpu(multicast->rec.qkey);
2962 } else
2963 event.event = RDMA_CM_EVENT_MULTICAST_ERROR;
2964
2965 ret = id_priv->id.event_handler(&id_priv->id, &event);
2966 if (ret) {
550e5ca7 2967 cma_exch(id_priv, RDMA_CM_DESTROYING);
de910bd9 2968 mutex_unlock(&id_priv->handler_mutex);
c8f6a362
SH
2969 rdma_destroy_id(&id_priv->id);
2970 return 0;
2971 }
8aa08602 2972
de910bd9 2973 mutex_unlock(&id_priv->handler_mutex);
c8f6a362
SH
2974 return 0;
2975}
2976
2977static void cma_set_mgid(struct rdma_id_private *id_priv,
2978 struct sockaddr *addr, union ib_gid *mgid)
2979{
2980 unsigned char mc_map[MAX_ADDR_LEN];
2981 struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
2982 struct sockaddr_in *sin = (struct sockaddr_in *) addr;
2983 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *) addr;
2984
2985 if (cma_any_addr(addr)) {
2986 memset(mgid, 0, sizeof *mgid);
2987 } else if ((addr->sa_family == AF_INET6) &&
1c9b2819 2988 ((be32_to_cpu(sin6->sin6_addr.s6_addr32[0]) & 0xFFF0FFFF) ==
c8f6a362
SH
2989 0xFF10A01B)) {
2990 /* IPv6 address is an SA assigned MGID. */
2991 memcpy(mgid, &sin6->sin6_addr, sizeof *mgid);
e2e62697
JG
2992 } else if ((addr->sa_family == AF_INET6)) {
2993 ipv6_ib_mc_map(&sin6->sin6_addr, dev_addr->broadcast, mc_map);
2994 if (id_priv->id.ps == RDMA_PS_UDP)
2995 mc_map[7] = 0x01; /* Use RDMA CM signature */
2996 *mgid = *(union ib_gid *) (mc_map + 4);
c8f6a362 2997 } else {
a9e527e3 2998 ip_ib_mc_map(sin->sin_addr.s_addr, dev_addr->broadcast, mc_map);
c8f6a362
SH
2999 if (id_priv->id.ps == RDMA_PS_UDP)
3000 mc_map[7] = 0x01; /* Use RDMA CM signature */
c8f6a362
SH
3001 *mgid = *(union ib_gid *) (mc_map + 4);
3002 }
3003}
3004
3005static int cma_join_ib_multicast(struct rdma_id_private *id_priv,
3006 struct cma_multicast *mc)
3007{
3008 struct ib_sa_mcmember_rec rec;
3009 struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
3010 ib_sa_comp_mask comp_mask;
3011 int ret;
3012
3013 ib_addr_get_mgid(dev_addr, &rec.mgid);
3014 ret = ib_sa_get_mcmember_rec(id_priv->id.device, id_priv->id.port_num,
3015 &rec.mgid, &rec);
3016 if (ret)
3017 return ret;
3018
3f446754 3019 cma_set_mgid(id_priv, (struct sockaddr *) &mc->addr, &rec.mgid);
c8f6a362
SH
3020 if (id_priv->id.ps == RDMA_PS_UDP)
3021 rec.qkey = cpu_to_be32(RDMA_UDP_QKEY);
6f8372b6 3022 rdma_addr_get_sgid(dev_addr, &rec.port_gid);
c8f6a362
SH
3023 rec.pkey = cpu_to_be16(ib_addr_get_pkey(dev_addr));
3024 rec.join_state = 1;
3025
3026 comp_mask = IB_SA_MCMEMBER_REC_MGID | IB_SA_MCMEMBER_REC_PORT_GID |
3027 IB_SA_MCMEMBER_REC_PKEY | IB_SA_MCMEMBER_REC_JOIN_STATE |
3028 IB_SA_MCMEMBER_REC_QKEY | IB_SA_MCMEMBER_REC_SL |
3029 IB_SA_MCMEMBER_REC_FLOW_LABEL |
3030 IB_SA_MCMEMBER_REC_TRAFFIC_CLASS;
3031
84adeee9
YE
3032 if (id_priv->id.ps == RDMA_PS_IPOIB)
3033 comp_mask |= IB_SA_MCMEMBER_REC_RATE |
3034 IB_SA_MCMEMBER_REC_RATE_SELECTOR;
3035
c8f6a362
SH
3036 mc->multicast.ib = ib_sa_join_multicast(&sa_client, id_priv->id.device,
3037 id_priv->id.port_num, &rec,
3038 comp_mask, GFP_KERNEL,
3039 cma_ib_mc_handler, mc);
3040 if (IS_ERR(mc->multicast.ib))
3041 return PTR_ERR(mc->multicast.ib);
3042
3043 return 0;
3044}
3045
3c86aa70
EC
3046static void iboe_mcast_work_handler(struct work_struct *work)
3047{
3048 struct iboe_mcast_work *mw = container_of(work, struct iboe_mcast_work, work);
3049 struct cma_multicast *mc = mw->mc;
3050 struct ib_sa_multicast *m = mc->multicast.ib;
3051
3052 mc->multicast.ib->context = mc;
3053 cma_ib_mc_handler(0, m);
3054 kref_put(&mc->mcref, release_mc);
3055 kfree(mw);
3056}
3057
3058static void cma_iboe_set_mgid(struct sockaddr *addr, union ib_gid *mgid)
3059{
3060 struct sockaddr_in *sin = (struct sockaddr_in *)addr;
3061 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)addr;
3062
3063 if (cma_any_addr(addr)) {
3064 memset(mgid, 0, sizeof *mgid);
3065 } else if (addr->sa_family == AF_INET6) {
3066 memcpy(mgid, &sin6->sin6_addr, sizeof *mgid);
3067 } else {
3068 mgid->raw[0] = 0xff;
3069 mgid->raw[1] = 0x0e;
3070 mgid->raw[2] = 0;
3071 mgid->raw[3] = 0;
3072 mgid->raw[4] = 0;
3073 mgid->raw[5] = 0;
3074 mgid->raw[6] = 0;
3075 mgid->raw[7] = 0;
3076 mgid->raw[8] = 0;
3077 mgid->raw[9] = 0;
3078 mgid->raw[10] = 0xff;
3079 mgid->raw[11] = 0xff;
3080 *(__be32 *)(&mgid->raw[12]) = sin->sin_addr.s_addr;
3081 }
3082}
3083
3084static int cma_iboe_join_multicast(struct rdma_id_private *id_priv,
3085 struct cma_multicast *mc)
3086{
3087 struct iboe_mcast_work *work;
3088 struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
3089 int err;
3090 struct sockaddr *addr = (struct sockaddr *)&mc->addr;
3091 struct net_device *ndev = NULL;
3092
3093 if (cma_zero_addr((struct sockaddr *)&mc->addr))
3094 return -EINVAL;
3095
3096 work = kzalloc(sizeof *work, GFP_KERNEL);
3097 if (!work)
3098 return -ENOMEM;
3099
3100 mc->multicast.ib = kzalloc(sizeof(struct ib_sa_multicast), GFP_KERNEL);
3101 if (!mc->multicast.ib) {
3102 err = -ENOMEM;
3103 goto out1;
3104 }
3105
3106 cma_iboe_set_mgid(addr, &mc->multicast.ib->rec.mgid);
3107
3108 mc->multicast.ib->rec.pkey = cpu_to_be16(0xffff);
3109 if (id_priv->id.ps == RDMA_PS_UDP)
3110 mc->multicast.ib->rec.qkey = cpu_to_be32(RDMA_UDP_QKEY);
3111
3112 if (dev_addr->bound_dev_if)
3113 ndev = dev_get_by_index(&init_net, dev_addr->bound_dev_if);
3114 if (!ndev) {
3115 err = -ENODEV;
3116 goto out2;
3117 }
3118 mc->multicast.ib->rec.rate = iboe_get_rate(ndev);
3119 mc->multicast.ib->rec.hop_limit = 1;
3120 mc->multicast.ib->rec.mtu = iboe_get_mtu(ndev->mtu);
3121 dev_put(ndev);
3122 if (!mc->multicast.ib->rec.mtu) {
3123 err = -EINVAL;
3124 goto out2;
3125 }
3126 iboe_addr_get_sgid(dev_addr, &mc->multicast.ib->rec.port_gid);
3127 work->id = id_priv;
3128 work->mc = mc;
3129 INIT_WORK(&work->work, iboe_mcast_work_handler);
3130 kref_get(&mc->mcref);
3131 queue_work(cma_wq, &work->work);
3132
3133 return 0;
3134
3135out2:
3136 kfree(mc->multicast.ib);
3137out1:
3138 kfree(work);
3139 return err;
3140}
3141
c8f6a362
SH
3142int rdma_join_multicast(struct rdma_cm_id *id, struct sockaddr *addr,
3143 void *context)
3144{
3145 struct rdma_id_private *id_priv;
3146 struct cma_multicast *mc;
3147 int ret;
3148
3149 id_priv = container_of(id, struct rdma_id_private, id);
550e5ca7
NM
3150 if (!cma_comp(id_priv, RDMA_CM_ADDR_BOUND) &&
3151 !cma_comp(id_priv, RDMA_CM_ADDR_RESOLVED))
c8f6a362
SH
3152 return -EINVAL;
3153
3154 mc = kmalloc(sizeof *mc, GFP_KERNEL);
3155 if (!mc)
3156 return -ENOMEM;
3157
3158 memcpy(&mc->addr, addr, ip_addr_size(addr));
3159 mc->context = context;
3160 mc->id_priv = id_priv;
3161
3162 spin_lock(&id_priv->lock);
3163 list_add(&mc->list, &id_priv->mc_list);
3164 spin_unlock(&id_priv->lock);
3165
3166 switch (rdma_node_get_transport(id->device->node_type)) {
3167 case RDMA_TRANSPORT_IB:
3c86aa70
EC
3168 switch (rdma_port_get_link_layer(id->device, id->port_num)) {
3169 case IB_LINK_LAYER_INFINIBAND:
3170 ret = cma_join_ib_multicast(id_priv, mc);
3171 break;
3172 case IB_LINK_LAYER_ETHERNET:
3173 kref_init(&mc->mcref);
3174 ret = cma_iboe_join_multicast(id_priv, mc);
3175 break;
3176 default:
3177 ret = -EINVAL;
3178 }
c8f6a362
SH
3179 break;
3180 default:
3181 ret = -ENOSYS;
3182 break;
3183 }
3184
3185 if (ret) {
3186 spin_lock_irq(&id_priv->lock);
3187 list_del(&mc->list);
3188 spin_unlock_irq(&id_priv->lock);
3189 kfree(mc);
3190 }
3191 return ret;
3192}
3193EXPORT_SYMBOL(rdma_join_multicast);
3194
3195void rdma_leave_multicast(struct rdma_cm_id *id, struct sockaddr *addr)
3196{
3197 struct rdma_id_private *id_priv;
3198 struct cma_multicast *mc;
3199
3200 id_priv = container_of(id, struct rdma_id_private, id);
3201 spin_lock_irq(&id_priv->lock);
3202 list_for_each_entry(mc, &id_priv->mc_list, list) {
3203 if (!memcmp(&mc->addr, addr, ip_addr_size(addr))) {
3204 list_del(&mc->list);
3205 spin_unlock_irq(&id_priv->lock);
3206
3207 if (id->qp)
3208 ib_detach_mcast(id->qp,
3209 &mc->multicast.ib->rec.mgid,
46ea5061 3210 be16_to_cpu(mc->multicast.ib->rec.mlid));
3c86aa70
EC
3211 if (rdma_node_get_transport(id_priv->cma_dev->device->node_type) == RDMA_TRANSPORT_IB) {
3212 switch (rdma_port_get_link_layer(id->device, id->port_num)) {
3213 case IB_LINK_LAYER_INFINIBAND:
3214 ib_sa_free_multicast(mc->multicast.ib);
3215 kfree(mc);
3216 break;
3217 case IB_LINK_LAYER_ETHERNET:
3218 kref_put(&mc->mcref, release_mc);
3219 break;
3220 default:
3221 break;
3222 }
3223 }
c8f6a362
SH
3224 return;
3225 }
3226 }
3227 spin_unlock_irq(&id_priv->lock);
3228}
3229EXPORT_SYMBOL(rdma_leave_multicast);
3230
dd5bdff8
OG
3231static int cma_netdev_change(struct net_device *ndev, struct rdma_id_private *id_priv)
3232{
3233 struct rdma_dev_addr *dev_addr;
3234 struct cma_ndev_work *work;
3235
3236 dev_addr = &id_priv->id.route.addr.dev_addr;
3237
6266ed6e 3238 if ((dev_addr->bound_dev_if == ndev->ifindex) &&
dd5bdff8
OG
3239 memcmp(dev_addr->src_dev_addr, ndev->dev_addr, ndev->addr_len)) {
3240 printk(KERN_INFO "RDMA CM addr change for ndev %s used by id %p\n",
3241 ndev->name, &id_priv->id);
3242 work = kzalloc(sizeof *work, GFP_KERNEL);
3243 if (!work)
3244 return -ENOMEM;
3245
3246 INIT_WORK(&work->work, cma_ndev_work_handler);
3247 work->id = id_priv;
3248 work->event.event = RDMA_CM_EVENT_ADDR_CHANGE;
3249 atomic_inc(&id_priv->refcount);
3250 queue_work(cma_wq, &work->work);
3251 }
3252
3253 return 0;
3254}
3255
3256static int cma_netdev_callback(struct notifier_block *self, unsigned long event,
3257 void *ctx)
3258{
3259 struct net_device *ndev = (struct net_device *)ctx;
3260 struct cma_device *cma_dev;
3261 struct rdma_id_private *id_priv;
3262 int ret = NOTIFY_DONE;
3263
3264 if (dev_net(ndev) != &init_net)
3265 return NOTIFY_DONE;
3266
3267 if (event != NETDEV_BONDING_FAILOVER)
3268 return NOTIFY_DONE;
3269
3270 if (!(ndev->flags & IFF_MASTER) || !(ndev->priv_flags & IFF_BONDING))
3271 return NOTIFY_DONE;
3272
3273 mutex_lock(&lock);
3274 list_for_each_entry(cma_dev, &dev_list, list)
3275 list_for_each_entry(id_priv, &cma_dev->id_list, list) {
3276 ret = cma_netdev_change(ndev, id_priv);
3277 if (ret)
3278 goto out;
3279 }
3280
3281out:
3282 mutex_unlock(&lock);
3283 return ret;
3284}
3285
3286static struct notifier_block cma_nb = {
3287 .notifier_call = cma_netdev_callback
3288};
3289
e51060f0
SH
3290static void cma_add_one(struct ib_device *device)
3291{
3292 struct cma_device *cma_dev;
3293 struct rdma_id_private *id_priv;
3294
3295 cma_dev = kmalloc(sizeof *cma_dev, GFP_KERNEL);
3296 if (!cma_dev)
3297 return;
3298
3299 cma_dev->device = device;
e51060f0
SH
3300
3301 init_completion(&cma_dev->comp);
3302 atomic_set(&cma_dev->refcount, 1);
3303 INIT_LIST_HEAD(&cma_dev->id_list);
3304 ib_set_client_data(device, &cma_client, cma_dev);
3305
3306 mutex_lock(&lock);
3307 list_add_tail(&cma_dev->list, &dev_list);
3308 list_for_each_entry(id_priv, &listen_any_list, list)
3309 cma_listen_on_dev(id_priv, cma_dev);
3310 mutex_unlock(&lock);
e51060f0
SH
3311}
3312
3313static int cma_remove_id_dev(struct rdma_id_private *id_priv)
3314{
a1b1b61f 3315 struct rdma_cm_event event;
550e5ca7 3316 enum rdma_cm_state state;
de910bd9 3317 int ret = 0;
e51060f0
SH
3318
3319 /* Record that we want to remove the device */
550e5ca7
NM
3320 state = cma_exch(id_priv, RDMA_CM_DEVICE_REMOVAL);
3321 if (state == RDMA_CM_DESTROYING)
e51060f0
SH
3322 return 0;
3323
3324 cma_cancel_operation(id_priv, state);
de910bd9 3325 mutex_lock(&id_priv->handler_mutex);
e51060f0
SH
3326
3327 /* Check for destruction from another callback. */
550e5ca7 3328 if (!cma_comp(id_priv, RDMA_CM_DEVICE_REMOVAL))
de910bd9 3329 goto out;
e51060f0 3330
a1b1b61f
SH
3331 memset(&event, 0, sizeof event);
3332 event.event = RDMA_CM_EVENT_DEVICE_REMOVAL;
de910bd9
OG
3333 ret = id_priv->id.event_handler(&id_priv->id, &event);
3334out:
3335 mutex_unlock(&id_priv->handler_mutex);
3336 return ret;
e51060f0
SH
3337}
3338
3339static void cma_process_remove(struct cma_device *cma_dev)
3340{
e51060f0
SH
3341 struct rdma_id_private *id_priv;
3342 int ret;
3343
e51060f0
SH
3344 mutex_lock(&lock);
3345 while (!list_empty(&cma_dev->id_list)) {
3346 id_priv = list_entry(cma_dev->id_list.next,
3347 struct rdma_id_private, list);
3348
d02d1f53 3349 list_del(&id_priv->listen_list);
94de178a 3350 list_del_init(&id_priv->list);
e51060f0
SH
3351 atomic_inc(&id_priv->refcount);
3352 mutex_unlock(&lock);
3353
d02d1f53 3354 ret = id_priv->internal_id ? 1 : cma_remove_id_dev(id_priv);
e51060f0
SH
3355 cma_deref_id(id_priv);
3356 if (ret)
3357 rdma_destroy_id(&id_priv->id);
3358
3359 mutex_lock(&lock);
3360 }
3361 mutex_unlock(&lock);
3362
3363 cma_deref_dev(cma_dev);
3364 wait_for_completion(&cma_dev->comp);
3365}
3366
3367static void cma_remove_one(struct ib_device *device)
3368{
3369 struct cma_device *cma_dev;
3370
3371 cma_dev = ib_get_client_data(device, &cma_client);
3372 if (!cma_dev)
3373 return;
3374
3375 mutex_lock(&lock);
3376 list_del(&cma_dev->list);
3377 mutex_unlock(&lock);
3378
3379 cma_process_remove(cma_dev);
3380 kfree(cma_dev);
3381}
3382
753f618a
NM
3383static int cma_get_id_stats(struct sk_buff *skb, struct netlink_callback *cb)
3384{
3385 struct nlmsghdr *nlh;
3386 struct rdma_cm_id_stats *id_stats;
3387 struct rdma_id_private *id_priv;
3388 struct rdma_cm_id *id = NULL;
3389 struct cma_device *cma_dev;
3390 int i_dev = 0, i_id = 0;
3391
3392 /*
3393 * We export all of the IDs as a sequence of messages. Each
3394 * ID gets its own netlink message.
3395 */
3396 mutex_lock(&lock);
3397
3398 list_for_each_entry(cma_dev, &dev_list, list) {
3399 if (i_dev < cb->args[0]) {
3400 i_dev++;
3401 continue;
3402 }
3403
3404 i_id = 0;
3405 list_for_each_entry(id_priv, &cma_dev->id_list, list) {
3406 if (i_id < cb->args[1]) {
3407 i_id++;
3408 continue;
3409 }
3410
3411 id_stats = ibnl_put_msg(skb, &nlh, cb->nlh->nlmsg_seq,
3412 sizeof *id_stats, RDMA_NL_RDMA_CM,
3413 RDMA_NL_RDMA_CM_ID_STATS);
3414 if (!id_stats)
3415 goto out;
3416
3417 memset(id_stats, 0, sizeof *id_stats);
3418 id = &id_priv->id;
3419 id_stats->node_type = id->route.addr.dev_addr.dev_type;
3420 id_stats->port_num = id->port_num;
3421 id_stats->bound_dev_if =
3422 id->route.addr.dev_addr.bound_dev_if;
3423
3424 if (id->route.addr.src_addr.ss_family == AF_INET) {
3425 if (ibnl_put_attr(skb, nlh,
3426 sizeof(struct sockaddr_in),
3427 &id->route.addr.src_addr,
3428 RDMA_NL_RDMA_CM_ATTR_SRC_ADDR)) {
3429 goto out;
3430 }
3431 if (ibnl_put_attr(skb, nlh,
3432 sizeof(struct sockaddr_in),
3433 &id->route.addr.dst_addr,
3434 RDMA_NL_RDMA_CM_ATTR_DST_ADDR)) {
3435 goto out;
3436 }
3437 } else if (id->route.addr.src_addr.ss_family == AF_INET6) {
3438 if (ibnl_put_attr(skb, nlh,
3439 sizeof(struct sockaddr_in6),
3440 &id->route.addr.src_addr,
3441 RDMA_NL_RDMA_CM_ATTR_SRC_ADDR)) {
3442 goto out;
3443 }
3444 if (ibnl_put_attr(skb, nlh,
3445 sizeof(struct sockaddr_in6),
3446 &id->route.addr.dst_addr,
3447 RDMA_NL_RDMA_CM_ATTR_DST_ADDR)) {
3448 goto out;
3449 }
3450 }
3451
83e9502d 3452 id_stats->pid = id_priv->owner;
753f618a
NM
3453 id_stats->port_space = id->ps;
3454 id_stats->cm_state = id_priv->state;
3455 id_stats->qp_num = id_priv->qp_num;
3456 id_stats->qp_type = id->qp_type;
3457
3458 i_id++;
3459 }
3460
3461 cb->args[1] = 0;
3462 i_dev++;
3463 }
3464
3465out:
3466 mutex_unlock(&lock);
3467 cb->args[0] = i_dev;
3468 cb->args[1] = i_id;
3469
3470 return skb->len;
3471}
3472
3473static const struct ibnl_client_cbs cma_cb_table[] = {
3474 [RDMA_NL_RDMA_CM_ID_STATS] = { .dump = cma_get_id_stats },
3475};
3476
716abb1f 3477static int __init cma_init(void)
e51060f0 3478{
5d7220e8 3479 int ret;
227b60f5 3480
c7f743a6 3481 cma_wq = create_singlethread_workqueue("rdma_cm");
e51060f0
SH
3482 if (!cma_wq)
3483 return -ENOMEM;
3484
c1a0b23b 3485 ib_sa_register_client(&sa_client);
7a118df3 3486 rdma_addr_register_client(&addr_client);
dd5bdff8 3487 register_netdevice_notifier(&cma_nb);
c1a0b23b 3488
e51060f0
SH
3489 ret = ib_register_client(&cma_client);
3490 if (ret)
3491 goto err;
753f618a
NM
3492
3493 if (ibnl_add_client(RDMA_NL_RDMA_CM, RDMA_NL_RDMA_CM_NUM_OPS, cma_cb_table))
3494 printk(KERN_WARNING "RDMA CMA: failed to add netlink callback\n");
3495
e51060f0
SH
3496 return 0;
3497
3498err:
dd5bdff8 3499 unregister_netdevice_notifier(&cma_nb);
7a118df3 3500 rdma_addr_unregister_client(&addr_client);
c1a0b23b 3501 ib_sa_unregister_client(&sa_client);
e51060f0
SH
3502 destroy_workqueue(cma_wq);
3503 return ret;
3504}
3505
716abb1f 3506static void __exit cma_cleanup(void)
e51060f0 3507{
753f618a 3508 ibnl_remove_client(RDMA_NL_RDMA_CM);
e51060f0 3509 ib_unregister_client(&cma_client);
dd5bdff8 3510 unregister_netdevice_notifier(&cma_nb);
7a118df3 3511 rdma_addr_unregister_client(&addr_client);
c1a0b23b 3512 ib_sa_unregister_client(&sa_client);
e51060f0
SH
3513 destroy_workqueue(cma_wq);
3514 idr_destroy(&sdp_ps);
3515 idr_destroy(&tcp_ps);
628e5f6d 3516 idr_destroy(&udp_ps);
c8f6a362 3517 idr_destroy(&ipoib_ps);
2d2e9415 3518 idr_destroy(&ib_ps);
e51060f0
SH
3519}
3520
/* Module entry and exit points. */
module_init(cma_init);
module_exit(cma_cleanup);