IB/mlx4: Fix port query for 56Gb Ethernet links
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / drivers / infiniband / hw / mlx4 / main.c
CommitLineData
225c7b1f
RD
1/*
2 * Copyright (c) 2006, 2007 Cisco Systems, Inc. All rights reserved.
51a379d0 3 * Copyright (c) 2007, 2008 Mellanox Technologies. All rights reserved.
225c7b1f
RD
4 *
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
10 *
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
13 * conditions are met:
14 *
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
17 * disclaimer.
18 *
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
23 *
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31 * SOFTWARE.
32 */
33
34#include <linux/module.h>
35#include <linux/init.h>
5a0e3ad6 36#include <linux/slab.h>
225c7b1f 37#include <linux/errno.h>
fa417f7b
EC
38#include <linux/netdevice.h>
39#include <linux/inetdevice.h>
40#include <linux/rtnetlink.h>
4c3eb3ca 41#include <linux/if_vlan.h>
225c7b1f
RD
42
43#include <rdma/ib_smi.h>
44#include <rdma/ib_user_verbs.h>
fa417f7b 45#include <rdma/ib_addr.h>
225c7b1f
RD
46
47#include <linux/mlx4/driver.h>
48#include <linux/mlx4/cmd.h>
49
50#include "mlx4_ib.h"
51#include "user.h"
52
b1d8eb5a 53#define DRV_NAME MLX4_IB_DRV_NAME
068c4ea1
JM
54#define DRV_VERSION "1.0"
55#define DRV_RELDATE "April 4, 2008"
225c7b1f
RD
56
57MODULE_AUTHOR("Roland Dreier");
58MODULE_DESCRIPTION("Mellanox ConnectX HCA InfiniBand driver");
59MODULE_LICENSE("Dual BSD/GPL");
60MODULE_VERSION(DRV_VERSION);
61
a0c64a17
JM
62int mlx4_ib_sm_guid_assign = 1;
63module_param_named(sm_guid_assign, mlx4_ib_sm_guid_assign, int, 0444);
64MODULE_PARM_DESC(sm_guid_assign, "Enable SM alias_GUID assignment if sm_guid_assign > 0 (Default: 1)");
65
68f3948d 66static const char mlx4_ib_version[] =
225c7b1f
RD
67 DRV_NAME ": Mellanox ConnectX InfiniBand driver v"
68 DRV_VERSION " (" DRV_RELDATE ")\n";
69
fa417f7b
EC
70struct update_gid_work {
71 struct work_struct work;
72 union ib_gid gids[128];
73 struct mlx4_ib_dev *dev;
74 int port;
75};
76
3806d08c
JM
/* Forward declaration; the definition lies outside this part of the file. */
static void do_slave_init(struct mlx4_ib_dev *ibdev, int slave, int do_init);

/*
 * Driver-private workqueue.
 * NOTE(review): presumably used to run update_gid_work items - confirm
 * against the code that queues them.
 */
static struct workqueue_struct *wq;
80
225c7b1f
RD
81static void init_query_mad(struct ib_smp *mad)
82{
83 mad->base_version = 1;
84 mad->mgmt_class = IB_MGMT_CLASS_SUBN_LID_ROUTED;
85 mad->class_version = 1;
86 mad->method = IB_MGMT_METHOD_GET;
87}
88
4c3eb3ca
EC
89static union ib_gid zgid;
90
225c7b1f
RD
91static int mlx4_ib_query_device(struct ib_device *ibdev,
92 struct ib_device_attr *props)
93{
94 struct mlx4_ib_dev *dev = to_mdev(ibdev);
95 struct ib_smp *in_mad = NULL;
96 struct ib_smp *out_mad = NULL;
97 int err = -ENOMEM;
98
99 in_mad = kzalloc(sizeof *in_mad, GFP_KERNEL);
100 out_mad = kmalloc(sizeof *out_mad, GFP_KERNEL);
101 if (!in_mad || !out_mad)
102 goto out;
103
104 init_query_mad(in_mad);
105 in_mad->attr_id = IB_SMP_ATTR_NODE_INFO;
106
0a9a0188
JM
107 err = mlx4_MAD_IFC(to_mdev(ibdev), MLX4_MAD_IFC_IGNORE_KEYS,
108 1, NULL, NULL, in_mad, out_mad);
225c7b1f
RD
109 if (err)
110 goto out;
111
112 memset(props, 0, sizeof *props);
113
114 props->fw_ver = dev->dev->caps.fw_ver;
115 props->device_cap_flags = IB_DEVICE_CHANGE_PHY_PORT |
116 IB_DEVICE_PORT_ACTIVE_EVENT |
117 IB_DEVICE_SYS_IMAGE_GUID |
521e575b
RL
118 IB_DEVICE_RC_RNR_NAK_GEN |
119 IB_DEVICE_BLOCK_MULTICAST_LOOPBACK;
225c7b1f
RD
120 if (dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_BAD_PKEY_CNTR)
121 props->device_cap_flags |= IB_DEVICE_BAD_PKEY_CNTR;
122 if (dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_BAD_QKEY_CNTR)
123 props->device_cap_flags |= IB_DEVICE_BAD_QKEY_CNTR;
124 if (dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_APM)
125 props->device_cap_flags |= IB_DEVICE_AUTO_PATH_MIG;
126 if (dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_UD_AV_PORT)
127 props->device_cap_flags |= IB_DEVICE_UD_AV_PORT_ENFORCE;
8ff095ec
EC
128 if (dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_IPOIB_CSUM)
129 props->device_cap_flags |= IB_DEVICE_UD_IP_CSUM;
417608c2 130 if (dev->dev->caps.max_gso_sz && dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_BLH)
b832be1e 131 props->device_cap_flags |= IB_DEVICE_UD_TSO;
95d04f07
RD
132 if (dev->dev->caps.bmme_flags & MLX4_BMME_FLAG_RESERVED_LKEY)
133 props->device_cap_flags |= IB_DEVICE_LOCAL_DMA_LKEY;
134 if ((dev->dev->caps.bmme_flags & MLX4_BMME_FLAG_LOCAL_INV) &&
135 (dev->dev->caps.bmme_flags & MLX4_BMME_FLAG_REMOTE_INV) &&
136 (dev->dev->caps.bmme_flags & MLX4_BMME_FLAG_FAST_REG_WR))
137 props->device_cap_flags |= IB_DEVICE_MEM_MGT_EXTENSIONS;
0a1405da
SH
138 if (dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_XRC)
139 props->device_cap_flags |= IB_DEVICE_XRC;
b425388d
SM
140 if (dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_MEM_WINDOW)
141 props->device_cap_flags |= IB_DEVICE_MEM_WINDOW;
142 if (dev->dev->caps.bmme_flags & MLX4_BMME_FLAG_TYPE_2_WIN) {
143 if (dev->dev->caps.bmme_flags & MLX4_BMME_FLAG_WIN_TYPE_2B)
144 props->device_cap_flags |= IB_DEVICE_MEM_WINDOW_TYPE_2B;
145 else
146 props->device_cap_flags |= IB_DEVICE_MEM_WINDOW_TYPE_2A;
147 }
225c7b1f
RD
148
149 props->vendor_id = be32_to_cpup((__be32 *) (out_mad->data + 36)) &
150 0xffffff;
992e8e6e 151 props->vendor_part_id = dev->dev->pdev->device;
225c7b1f
RD
152 props->hw_ver = be32_to_cpup((__be32 *) (out_mad->data + 32));
153 memcpy(&props->sys_image_guid, out_mad->data + 4, 8);
154
155 props->max_mr_size = ~0ull;
156 props->page_size_cap = dev->dev->caps.page_size_cap;
157 props->max_qp = dev->dev->caps.num_qps - dev->dev->caps.reserved_qps;
fc2d0044 158 props->max_qp_wr = dev->dev->caps.max_wqes - MLX4_IB_SQ_MAX_SPARE;
225c7b1f
RD
159 props->max_sge = min(dev->dev->caps.max_sq_sg,
160 dev->dev->caps.max_rq_sg);
161 props->max_cq = dev->dev->caps.num_cqs - dev->dev->caps.reserved_cqs;
162 props->max_cqe = dev->dev->caps.max_cqes;
163 props->max_mr = dev->dev->caps.num_mpts - dev->dev->caps.reserved_mrws;
164 props->max_pd = dev->dev->caps.num_pds - dev->dev->caps.reserved_pds;
165 props->max_qp_rd_atom = dev->dev->caps.max_qp_dest_rdma;
166 props->max_qp_init_rd_atom = dev->dev->caps.max_qp_init_rdma;
167 props->max_res_rd_atom = props->max_qp_rd_atom * props->max_qp;
168 props->max_srq = dev->dev->caps.num_srqs - dev->dev->caps.reserved_srqs;
c8681f14 169 props->max_srq_wr = dev->dev->caps.max_srq_wqes - 1;
225c7b1f 170 props->max_srq_sge = dev->dev->caps.max_srq_sge;
5a0fd094 171 props->max_fast_reg_page_list_len = MLX4_MAX_FAST_REG_PAGES;
225c7b1f
RD
172 props->local_ca_ack_delay = dev->dev->caps.local_ca_ack_delay;
173 props->atomic_cap = dev->dev->caps.flags & MLX4_DEV_CAP_FLAG_ATOMIC ?
174 IB_ATOMIC_HCA : IB_ATOMIC_NONE;
47e956b2 175 props->masked_atomic_cap = props->atomic_cap;
5ae2a7a8 176 props->max_pkeys = dev->dev->caps.pkey_table_len[1];
225c7b1f
RD
177 props->max_mcast_grp = dev->dev->caps.num_mgms + dev->dev->caps.num_amgms;
178 props->max_mcast_qp_attach = dev->dev->caps.num_qp_per_mgm;
179 props->max_total_mcast_qp_attach = props->max_mcast_qp_attach *
180 props->max_mcast_grp;
a5bbe892 181 props->max_map_per_fmr = dev->dev->caps.max_fmr_maps;
225c7b1f
RD
182
183out:
184 kfree(in_mad);
185 kfree(out_mad);
186
187 return err;
188}
189
fa417f7b
EC
190static enum rdma_link_layer
191mlx4_ib_port_link_layer(struct ib_device *device, u8 port_num)
225c7b1f 192{
fa417f7b 193 struct mlx4_dev *dev = to_mdev(device)->dev;
225c7b1f 194
65dab25d 195 return dev->caps.port_mask[port_num] == MLX4_PORT_TYPE_IB ?
fa417f7b
EC
196 IB_LINK_LAYER_INFINIBAND : IB_LINK_LAYER_ETHERNET;
197}
225c7b1f 198
fa417f7b 199static int ib_link_query_port(struct ib_device *ibdev, u8 port,
0a9a0188 200 struct ib_port_attr *props, int netw_view)
fa417f7b 201{
a9c766bb
OG
202 struct ib_smp *in_mad = NULL;
203 struct ib_smp *out_mad = NULL;
a5e12dff 204 int ext_active_speed;
0a9a0188 205 int mad_ifc_flags = MLX4_MAD_IFC_IGNORE_KEYS;
a9c766bb
OG
206 int err = -ENOMEM;
207
208 in_mad = kzalloc(sizeof *in_mad, GFP_KERNEL);
209 out_mad = kmalloc(sizeof *out_mad, GFP_KERNEL);
210 if (!in_mad || !out_mad)
211 goto out;
212
213 init_query_mad(in_mad);
214 in_mad->attr_id = IB_SMP_ATTR_PORT_INFO;
215 in_mad->attr_mod = cpu_to_be32(port);
216
0a9a0188
JM
217 if (mlx4_is_mfunc(to_mdev(ibdev)->dev) && netw_view)
218 mad_ifc_flags |= MLX4_MAD_IFC_NET_VIEW;
219
220 err = mlx4_MAD_IFC(to_mdev(ibdev), mad_ifc_flags, port, NULL, NULL,
a9c766bb
OG
221 in_mad, out_mad);
222 if (err)
223 goto out;
224
a5e12dff 225
225c7b1f
RD
226 props->lid = be16_to_cpup((__be16 *) (out_mad->data + 16));
227 props->lmc = out_mad->data[34] & 0x7;
228 props->sm_lid = be16_to_cpup((__be16 *) (out_mad->data + 18));
229 props->sm_sl = out_mad->data[36] & 0xf;
230 props->state = out_mad->data[32] & 0xf;
231 props->phys_state = out_mad->data[33] >> 4;
232 props->port_cap_flags = be32_to_cpup((__be32 *) (out_mad->data + 20));
0a9a0188
JM
233 if (netw_view)
234 props->gid_tbl_len = out_mad->data[50];
235 else
236 props->gid_tbl_len = to_mdev(ibdev)->dev->caps.gid_table_len[port];
149983af 237 props->max_msg_sz = to_mdev(ibdev)->dev->caps.max_msg_sz;
5ae2a7a8 238 props->pkey_tbl_len = to_mdev(ibdev)->dev->caps.pkey_table_len[port];
225c7b1f
RD
239 props->bad_pkey_cntr = be16_to_cpup((__be16 *) (out_mad->data + 46));
240 props->qkey_viol_cntr = be16_to_cpup((__be16 *) (out_mad->data + 48));
241 props->active_width = out_mad->data[31] & 0xf;
242 props->active_speed = out_mad->data[35] >> 4;
243 props->max_mtu = out_mad->data[41] & 0xf;
244 props->active_mtu = out_mad->data[36] >> 4;
245 props->subnet_timeout = out_mad->data[51] & 0x1f;
246 props->max_vl_num = out_mad->data[37] >> 4;
247 props->init_type_reply = out_mad->data[41] >> 4;
248
a5e12dff
MA
249 /* Check if extended speeds (EDR/FDR/...) are supported */
250 if (props->port_cap_flags & IB_PORT_EXTENDED_SPEEDS_SUP) {
251 ext_active_speed = out_mad->data[62] >> 4;
252
253 switch (ext_active_speed) {
254 case 1:
2e96691c 255 props->active_speed = IB_SPEED_FDR;
a5e12dff
MA
256 break;
257 case 2:
2e96691c 258 props->active_speed = IB_SPEED_EDR;
a5e12dff
MA
259 break;
260 }
261 }
262
263 /* If reported active speed is QDR, check if is FDR-10 */
2e96691c 264 if (props->active_speed == IB_SPEED_QDR) {
8154c07f
OG
265 init_query_mad(in_mad);
266 in_mad->attr_id = MLX4_ATTR_EXTENDED_PORT_INFO;
267 in_mad->attr_mod = cpu_to_be32(port);
268
0a9a0188 269 err = mlx4_MAD_IFC(to_mdev(ibdev), mad_ifc_flags, port,
8154c07f
OG
270 NULL, NULL, in_mad, out_mad);
271 if (err)
bf6b47de 272 goto out;
8154c07f
OG
273
274 /* Checking LinkSpeedActive for FDR-10 */
275 if (out_mad->data[15] & 0x1)
276 props->active_speed = IB_SPEED_FDR10;
a5e12dff 277 }
d2ef4068
OG
278
279 /* Avoid wrong speed value returned by FW if the IB link is down. */
280 if (props->state == IB_PORT_DOWN)
281 props->active_speed = IB_SPEED_SDR;
282
a9c766bb
OG
283out:
284 kfree(in_mad);
285 kfree(out_mad);
286 return err;
fa417f7b
EC
287}
288
289static u8 state_to_phys_state(enum ib_port_state state)
290{
291 return state == IB_PORT_ACTIVE ? 5 : 3;
292}
293
294static int eth_link_query_port(struct ib_device *ibdev, u8 port,
0a9a0188 295 struct ib_port_attr *props, int netw_view)
fa417f7b 296{
a9c766bb
OG
297
298 struct mlx4_ib_dev *mdev = to_mdev(ibdev);
299 struct mlx4_ib_iboe *iboe = &mdev->iboe;
fa417f7b
EC
300 struct net_device *ndev;
301 enum ib_mtu tmp;
a9c766bb
OG
302 struct mlx4_cmd_mailbox *mailbox;
303 int err = 0;
304
305 mailbox = mlx4_alloc_cmd_mailbox(mdev->dev);
306 if (IS_ERR(mailbox))
307 return PTR_ERR(mailbox);
fa417f7b 308
a9c766bb
OG
309 err = mlx4_cmd_box(mdev->dev, 0, mailbox->dma, port, 0,
310 MLX4_CMD_QUERY_PORT, MLX4_CMD_TIME_CLASS_B,
311 MLX4_CMD_WRAPPED);
312 if (err)
313 goto out;
314
7d26287e
SM
315 props->active_width = (((u8 *)mailbox->buf)[5] == 0x40) ||
316 (((u8 *)mailbox->buf)[5] == 0x20 /*56Gb*/) ?
317 IB_WIDTH_4X : IB_WIDTH_1X;
318 props->active_speed = (((u8 *)mailbox->buf)[5] == 0x20 /*56Gb*/) ?
319 IB_SPEED_FDR : IB_SPEED_QDR;
fa417f7b 320 props->port_cap_flags = IB_PORT_CM_SUP;
a9c766bb
OG
321 props->gid_tbl_len = mdev->dev->caps.gid_table_len[port];
322 props->max_msg_sz = mdev->dev->caps.max_msg_sz;
fa417f7b 323 props->pkey_tbl_len = 1;
bcacb897 324 props->max_mtu = IB_MTU_4096;
a9c766bb 325 props->max_vl_num = 2;
fa417f7b
EC
326 props->state = IB_PORT_DOWN;
327 props->phys_state = state_to_phys_state(props->state);
328 props->active_mtu = IB_MTU_256;
329 spin_lock(&iboe->lock);
330 ndev = iboe->netdevs[port - 1];
331 if (!ndev)
a9c766bb 332 goto out_unlock;
fa417f7b
EC
333
334 tmp = iboe_get_mtu(ndev->mtu);
335 props->active_mtu = tmp ? min(props->max_mtu, tmp) : IB_MTU_256;
336
21d60609 337 props->state = (netif_running(ndev) && netif_carrier_ok(ndev)) ?
fa417f7b
EC
338 IB_PORT_ACTIVE : IB_PORT_DOWN;
339 props->phys_state = state_to_phys_state(props->state);
a9c766bb 340out_unlock:
fa417f7b 341 spin_unlock(&iboe->lock);
a9c766bb
OG
342out:
343 mlx4_free_cmd_mailbox(mdev->dev, mailbox);
344 return err;
fa417f7b
EC
345}
346
0a9a0188
JM
347int __mlx4_ib_query_port(struct ib_device *ibdev, u8 port,
348 struct ib_port_attr *props, int netw_view)
fa417f7b 349{
a9c766bb 350 int err;
fa417f7b
EC
351
352 memset(props, 0, sizeof *props);
353
fa417f7b 354 err = mlx4_ib_port_link_layer(ibdev, port) == IB_LINK_LAYER_INFINIBAND ?
0a9a0188
JM
355 ib_link_query_port(ibdev, port, props, netw_view) :
356 eth_link_query_port(ibdev, port, props, netw_view);
225c7b1f
RD
357
358 return err;
359}
360
0a9a0188
JM
361static int mlx4_ib_query_port(struct ib_device *ibdev, u8 port,
362 struct ib_port_attr *props)
363{
364 /* returns host view */
365 return __mlx4_ib_query_port(ibdev, port, props, 0);
366}
367
a0c64a17
JM
368int __mlx4_ib_query_gid(struct ib_device *ibdev, u8 port, int index,
369 union ib_gid *gid, int netw_view)
225c7b1f
RD
370{
371 struct ib_smp *in_mad = NULL;
372 struct ib_smp *out_mad = NULL;
373 int err = -ENOMEM;
a0c64a17
JM
374 struct mlx4_ib_dev *dev = to_mdev(ibdev);
375 int clear = 0;
376 int mad_ifc_flags = MLX4_MAD_IFC_IGNORE_KEYS;
225c7b1f
RD
377
378 in_mad = kzalloc(sizeof *in_mad, GFP_KERNEL);
379 out_mad = kmalloc(sizeof *out_mad, GFP_KERNEL);
380 if (!in_mad || !out_mad)
381 goto out;
382
383 init_query_mad(in_mad);
384 in_mad->attr_id = IB_SMP_ATTR_PORT_INFO;
385 in_mad->attr_mod = cpu_to_be32(port);
386
a0c64a17
JM
387 if (mlx4_is_mfunc(dev->dev) && netw_view)
388 mad_ifc_flags |= MLX4_MAD_IFC_NET_VIEW;
389
390 err = mlx4_MAD_IFC(dev, mad_ifc_flags, port, NULL, NULL, in_mad, out_mad);
225c7b1f
RD
391 if (err)
392 goto out;
393
394 memcpy(gid->raw, out_mad->data + 8, 8);
395
a0c64a17
JM
396 if (mlx4_is_mfunc(dev->dev) && !netw_view) {
397 if (index) {
398 /* For any index > 0, return the null guid */
399 err = 0;
400 clear = 1;
401 goto out;
402 }
403 }
404
225c7b1f
RD
405 init_query_mad(in_mad);
406 in_mad->attr_id = IB_SMP_ATTR_GUID_INFO;
407 in_mad->attr_mod = cpu_to_be32(index / 8);
408
a0c64a17 409 err = mlx4_MAD_IFC(dev, mad_ifc_flags, port,
0a9a0188 410 NULL, NULL, in_mad, out_mad);
225c7b1f
RD
411 if (err)
412 goto out;
413
414 memcpy(gid->raw + 8, out_mad->data + (index % 8) * 8, 8);
415
416out:
a0c64a17
JM
417 if (clear)
418 memset(gid->raw + 8, 0, 8);
225c7b1f
RD
419 kfree(in_mad);
420 kfree(out_mad);
421 return err;
422}
423
fa417f7b
EC
424static int iboe_query_gid(struct ib_device *ibdev, u8 port, int index,
425 union ib_gid *gid)
426{
427 struct mlx4_ib_dev *dev = to_mdev(ibdev);
428
429 *gid = dev->iboe.gid_table[port - 1][index];
430
431 return 0;
432}
433
434static int mlx4_ib_query_gid(struct ib_device *ibdev, u8 port, int index,
435 union ib_gid *gid)
436{
437 if (rdma_port_get_link_layer(ibdev, port) == IB_LINK_LAYER_INFINIBAND)
a0c64a17 438 return __mlx4_ib_query_gid(ibdev, port, index, gid, 0);
fa417f7b
EC
439 else
440 return iboe_query_gid(ibdev, port, index, gid);
441}
442
0a9a0188
JM
443int __mlx4_ib_query_pkey(struct ib_device *ibdev, u8 port, u16 index,
444 u16 *pkey, int netw_view)
225c7b1f
RD
445{
446 struct ib_smp *in_mad = NULL;
447 struct ib_smp *out_mad = NULL;
0a9a0188 448 int mad_ifc_flags = MLX4_MAD_IFC_IGNORE_KEYS;
225c7b1f
RD
449 int err = -ENOMEM;
450
451 in_mad = kzalloc(sizeof *in_mad, GFP_KERNEL);
452 out_mad = kmalloc(sizeof *out_mad, GFP_KERNEL);
453 if (!in_mad || !out_mad)
454 goto out;
455
456 init_query_mad(in_mad);
457 in_mad->attr_id = IB_SMP_ATTR_PKEY_TABLE;
458 in_mad->attr_mod = cpu_to_be32(index / 32);
459
0a9a0188
JM
460 if (mlx4_is_mfunc(to_mdev(ibdev)->dev) && netw_view)
461 mad_ifc_flags |= MLX4_MAD_IFC_NET_VIEW;
462
463 err = mlx4_MAD_IFC(to_mdev(ibdev), mad_ifc_flags, port, NULL, NULL,
464 in_mad, out_mad);
225c7b1f
RD
465 if (err)
466 goto out;
467
468 *pkey = be16_to_cpu(((__be16 *) out_mad->data)[index % 32]);
469
470out:
471 kfree(in_mad);
472 kfree(out_mad);
473 return err;
474}
475
0a9a0188
JM
476static int mlx4_ib_query_pkey(struct ib_device *ibdev, u8 port, u16 index, u16 *pkey)
477{
478 return __mlx4_ib_query_pkey(ibdev, port, index, pkey, 0);
479}
480
225c7b1f
RD
481static int mlx4_ib_modify_device(struct ib_device *ibdev, int mask,
482 struct ib_device_modify *props)
483{
d0d68b86 484 struct mlx4_cmd_mailbox *mailbox;
df7fba66 485 unsigned long flags;
d0d68b86 486
225c7b1f
RD
487 if (mask & ~IB_DEVICE_MODIFY_NODE_DESC)
488 return -EOPNOTSUPP;
489
d0d68b86
JM
490 if (!(mask & IB_DEVICE_MODIFY_NODE_DESC))
491 return 0;
492
992e8e6e
JM
493 if (mlx4_is_slave(to_mdev(ibdev)->dev))
494 return -EOPNOTSUPP;
495
df7fba66 496 spin_lock_irqsave(&to_mdev(ibdev)->sm_lock, flags);
d0d68b86 497 memcpy(ibdev->node_desc, props->node_desc, 64);
df7fba66 498 spin_unlock_irqrestore(&to_mdev(ibdev)->sm_lock, flags);
d0d68b86
JM
499
500 /*
501 * If possible, pass node desc to FW, so it can generate
502 * a 144 trap. If cmd fails, just ignore.
503 */
504 mailbox = mlx4_alloc_cmd_mailbox(to_mdev(ibdev)->dev);
505 if (IS_ERR(mailbox))
506 return 0;
507
508 memset(mailbox->buf, 0, 256);
509 memcpy(mailbox->buf, props->node_desc, 64);
510 mlx4_cmd(to_mdev(ibdev)->dev, mailbox->dma, 1, 0,
992e8e6e 511 MLX4_CMD_SET_NODE, MLX4_CMD_TIME_CLASS_A, MLX4_CMD_NATIVE);
d0d68b86
JM
512
513 mlx4_free_cmd_mailbox(to_mdev(ibdev)->dev, mailbox);
225c7b1f
RD
514
515 return 0;
516}
517
518static int mlx4_SET_PORT(struct mlx4_ib_dev *dev, u8 port, int reset_qkey_viols,
519 u32 cap_mask)
520{
521 struct mlx4_cmd_mailbox *mailbox;
522 int err;
fa417f7b 523 u8 is_eth = dev->dev->caps.port_type[port] == MLX4_PORT_TYPE_ETH;
225c7b1f
RD
524
525 mailbox = mlx4_alloc_cmd_mailbox(dev->dev);
526 if (IS_ERR(mailbox))
527 return PTR_ERR(mailbox);
528
529 memset(mailbox->buf, 0, 256);
5ae2a7a8
RD
530
531 if (dev->dev->flags & MLX4_FLAG_OLD_PORT_CMDS) {
532 *(u8 *) mailbox->buf = !!reset_qkey_viols << 6;
533 ((__be32 *) mailbox->buf)[2] = cpu_to_be32(cap_mask);
534 } else {
535 ((u8 *) mailbox->buf)[3] = !!reset_qkey_viols;
536 ((__be32 *) mailbox->buf)[1] = cpu_to_be32(cap_mask);
537 }
225c7b1f 538
fa417f7b 539 err = mlx4_cmd(dev->dev, mailbox->dma, port, is_eth, MLX4_CMD_SET_PORT,
f9baff50 540 MLX4_CMD_TIME_CLASS_B, MLX4_CMD_NATIVE);
225c7b1f
RD
541
542 mlx4_free_cmd_mailbox(dev->dev, mailbox);
543 return err;
544}
545
546static int mlx4_ib_modify_port(struct ib_device *ibdev, u8 port, int mask,
547 struct ib_port_modify *props)
548{
549 struct ib_port_attr attr;
550 u32 cap_mask;
551 int err;
552
553 mutex_lock(&to_mdev(ibdev)->cap_mask_mutex);
554
555 err = mlx4_ib_query_port(ibdev, port, &attr);
556 if (err)
557 goto out;
558
559 cap_mask = (attr.port_cap_flags | props->set_port_cap_mask) &
560 ~props->clr_port_cap_mask;
561
562 err = mlx4_SET_PORT(to_mdev(ibdev), port,
563 !!(mask & IB_PORT_RESET_QKEY_CNTR),
564 cap_mask);
565
566out:
567 mutex_unlock(&to_mdev(ibdev)->cap_mask_mutex);
568 return err;
569}
570
571static struct ib_ucontext *mlx4_ib_alloc_ucontext(struct ib_device *ibdev,
572 struct ib_udata *udata)
573{
574 struct mlx4_ib_dev *dev = to_mdev(ibdev);
575 struct mlx4_ib_ucontext *context;
08ff3235 576 struct mlx4_ib_alloc_ucontext_resp_v3 resp_v3;
225c7b1f
RD
577 struct mlx4_ib_alloc_ucontext_resp resp;
578 int err;
579
3b4a8cd5
JM
580 if (!dev->ib_active)
581 return ERR_PTR(-EAGAIN);
582
08ff3235
OG
583 if (ibdev->uverbs_abi_ver == MLX4_IB_UVERBS_NO_DEV_CAPS_ABI_VERSION) {
584 resp_v3.qp_tab_size = dev->dev->caps.num_qps;
585 resp_v3.bf_reg_size = dev->dev->caps.bf_reg_size;
586 resp_v3.bf_regs_per_page = dev->dev->caps.bf_regs_per_page;
587 } else {
588 resp.dev_caps = dev->dev->caps.userspace_caps;
589 resp.qp_tab_size = dev->dev->caps.num_qps;
590 resp.bf_reg_size = dev->dev->caps.bf_reg_size;
591 resp.bf_regs_per_page = dev->dev->caps.bf_regs_per_page;
592 resp.cqe_size = dev->dev->caps.cqe_size;
593 }
225c7b1f
RD
594
595 context = kmalloc(sizeof *context, GFP_KERNEL);
596 if (!context)
597 return ERR_PTR(-ENOMEM);
598
599 err = mlx4_uar_alloc(to_mdev(ibdev)->dev, &context->uar);
600 if (err) {
601 kfree(context);
602 return ERR_PTR(err);
603 }
604
605 INIT_LIST_HEAD(&context->db_page_list);
606 mutex_init(&context->db_page_mutex);
607
08ff3235
OG
608 if (ibdev->uverbs_abi_ver == MLX4_IB_UVERBS_NO_DEV_CAPS_ABI_VERSION)
609 err = ib_copy_to_udata(udata, &resp_v3, sizeof(resp_v3));
610 else
611 err = ib_copy_to_udata(udata, &resp, sizeof(resp));
612
225c7b1f
RD
613 if (err) {
614 mlx4_uar_free(to_mdev(ibdev)->dev, &context->uar);
615 kfree(context);
616 return ERR_PTR(-EFAULT);
617 }
618
619 return &context->ibucontext;
620}
621
622static int mlx4_ib_dealloc_ucontext(struct ib_ucontext *ibcontext)
623{
624 struct mlx4_ib_ucontext *context = to_mucontext(ibcontext);
625
626 mlx4_uar_free(to_mdev(ibcontext->device)->dev, &context->uar);
627 kfree(context);
628
629 return 0;
630}
631
632static int mlx4_ib_mmap(struct ib_ucontext *context, struct vm_area_struct *vma)
633{
634 struct mlx4_ib_dev *dev = to_mdev(context->device);
635
636 if (vma->vm_end - vma->vm_start != PAGE_SIZE)
637 return -EINVAL;
638
639 if (vma->vm_pgoff == 0) {
640 vma->vm_page_prot = pgprot_noncached(vma->vm_page_prot);
641
642 if (io_remap_pfn_range(vma, vma->vm_start,
643 to_mucontext(context)->uar.pfn,
644 PAGE_SIZE, vma->vm_page_prot))
645 return -EAGAIN;
646 } else if (vma->vm_pgoff == 1 && dev->dev->caps.bf_reg_size != 0) {
e1d60ec6 647 vma->vm_page_prot = pgprot_writecombine(vma->vm_page_prot);
225c7b1f
RD
648
649 if (io_remap_pfn_range(vma, vma->vm_start,
650 to_mucontext(context)->uar.pfn +
651 dev->dev->caps.num_uars,
652 PAGE_SIZE, vma->vm_page_prot))
653 return -EAGAIN;
654 } else
655 return -EINVAL;
656
657 return 0;
658}
659
660static struct ib_pd *mlx4_ib_alloc_pd(struct ib_device *ibdev,
661 struct ib_ucontext *context,
662 struct ib_udata *udata)
663{
664 struct mlx4_ib_pd *pd;
665 int err;
666
667 pd = kmalloc(sizeof *pd, GFP_KERNEL);
668 if (!pd)
669 return ERR_PTR(-ENOMEM);
670
671 err = mlx4_pd_alloc(to_mdev(ibdev)->dev, &pd->pdn);
672 if (err) {
673 kfree(pd);
674 return ERR_PTR(err);
675 }
676
677 if (context)
678 if (ib_copy_to_udata(udata, &pd->pdn, sizeof (__u32))) {
679 mlx4_pd_free(to_mdev(ibdev)->dev, pd->pdn);
680 kfree(pd);
681 return ERR_PTR(-EFAULT);
682 }
683
684 return &pd->ibpd;
685}
686
687static int mlx4_ib_dealloc_pd(struct ib_pd *pd)
688{
689 mlx4_pd_free(to_mdev(pd->device)->dev, to_mpd(pd)->pdn);
690 kfree(pd);
691
692 return 0;
693}
694
012a8ff5
SH
695static struct ib_xrcd *mlx4_ib_alloc_xrcd(struct ib_device *ibdev,
696 struct ib_ucontext *context,
697 struct ib_udata *udata)
698{
699 struct mlx4_ib_xrcd *xrcd;
700 int err;
701
702 if (!(to_mdev(ibdev)->dev->caps.flags & MLX4_DEV_CAP_FLAG_XRC))
703 return ERR_PTR(-ENOSYS);
704
705 xrcd = kmalloc(sizeof *xrcd, GFP_KERNEL);
706 if (!xrcd)
707 return ERR_PTR(-ENOMEM);
708
709 err = mlx4_xrcd_alloc(to_mdev(ibdev)->dev, &xrcd->xrcdn);
710 if (err)
711 goto err1;
712
713 xrcd->pd = ib_alloc_pd(ibdev);
714 if (IS_ERR(xrcd->pd)) {
715 err = PTR_ERR(xrcd->pd);
716 goto err2;
717 }
718
719 xrcd->cq = ib_create_cq(ibdev, NULL, NULL, xrcd, 1, 0);
720 if (IS_ERR(xrcd->cq)) {
721 err = PTR_ERR(xrcd->cq);
722 goto err3;
723 }
724
725 return &xrcd->ibxrcd;
726
727err3:
728 ib_dealloc_pd(xrcd->pd);
729err2:
730 mlx4_xrcd_free(to_mdev(ibdev)->dev, xrcd->xrcdn);
731err1:
732 kfree(xrcd);
733 return ERR_PTR(err);
734}
735
736static int mlx4_ib_dealloc_xrcd(struct ib_xrcd *xrcd)
737{
738 ib_destroy_cq(to_mxrcd(xrcd)->cq);
739 ib_dealloc_pd(to_mxrcd(xrcd)->pd);
740 mlx4_xrcd_free(to_mdev(xrcd->device)->dev, to_mxrcd(xrcd)->xrcdn);
741 kfree(xrcd);
742
743 return 0;
744}
745
fa417f7b
EC
746static int add_gid_entry(struct ib_qp *ibqp, union ib_gid *gid)
747{
748 struct mlx4_ib_qp *mqp = to_mqp(ibqp);
749 struct mlx4_ib_dev *mdev = to_mdev(ibqp->device);
750 struct mlx4_ib_gid_entry *ge;
751
752 ge = kzalloc(sizeof *ge, GFP_KERNEL);
753 if (!ge)
754 return -ENOMEM;
755
756 ge->gid = *gid;
757 if (mlx4_ib_add_mc(mdev, mqp, gid)) {
758 ge->port = mqp->port;
759 ge->added = 1;
760 }
761
762 mutex_lock(&mqp->mutex);
763 list_add_tail(&ge->list, &mqp->gid_list);
764 mutex_unlock(&mqp->mutex);
765
766 return 0;
767}
768
769int mlx4_ib_add_mc(struct mlx4_ib_dev *mdev, struct mlx4_ib_qp *mqp,
770 union ib_gid *gid)
771{
772 u8 mac[6];
773 struct net_device *ndev;
774 int ret = 0;
775
776 if (!mqp->port)
777 return 0;
778
779 spin_lock(&mdev->iboe.lock);
780 ndev = mdev->iboe.netdevs[mqp->port - 1];
781 if (ndev)
782 dev_hold(ndev);
783 spin_unlock(&mdev->iboe.lock);
784
785 if (ndev) {
786 rdma_get_mcast_mac((struct in6_addr *)gid, mac);
787 rtnl_lock();
788 dev_mc_add(mdev->iboe.netdevs[mqp->port - 1], mac);
789 ret = 1;
790 rtnl_unlock();
791 dev_put(ndev);
792 }
793
794 return ret;
795}
796
0ff1fb65
HHZ
797struct mlx4_ib_steering {
798 struct list_head list;
799 u64 reg_id;
800 union ib_gid gid;
801};
802
225c7b1f
RD
803static int mlx4_ib_mcg_attach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
804{
fa417f7b
EC
805 int err;
806 struct mlx4_ib_dev *mdev = to_mdev(ibqp->device);
807 struct mlx4_ib_qp *mqp = to_mqp(ibqp);
0ff1fb65
HHZ
808 u64 reg_id;
809 struct mlx4_ib_steering *ib_steering = NULL;
810
811 if (mdev->dev->caps.steering_mode ==
812 MLX4_STEERING_MODE_DEVICE_MANAGED) {
813 ib_steering = kmalloc(sizeof(*ib_steering), GFP_KERNEL);
814 if (!ib_steering)
815 return -ENOMEM;
816 }
fa417f7b 817
0ff1fb65
HHZ
818 err = mlx4_multicast_attach(mdev->dev, &mqp->mqp, gid->raw, mqp->port,
819 !!(mqp->flags &
820 MLX4_IB_QP_BLOCK_MULTICAST_LOOPBACK),
821 MLX4_PROT_IB_IPV6, &reg_id);
fa417f7b 822 if (err)
0ff1fb65 823 goto err_malloc;
fa417f7b
EC
824
825 err = add_gid_entry(ibqp, gid);
826 if (err)
827 goto err_add;
828
0ff1fb65
HHZ
829 if (ib_steering) {
830 memcpy(ib_steering->gid.raw, gid->raw, 16);
831 ib_steering->reg_id = reg_id;
832 mutex_lock(&mqp->mutex);
833 list_add(&ib_steering->list, &mqp->steering_rules);
834 mutex_unlock(&mqp->mutex);
835 }
fa417f7b
EC
836 return 0;
837
838err_add:
0ff1fb65
HHZ
839 mlx4_multicast_detach(mdev->dev, &mqp->mqp, gid->raw,
840 MLX4_PROT_IB_IPV6, reg_id);
841err_malloc:
842 kfree(ib_steering);
843
fa417f7b
EC
844 return err;
845}
846
847static struct mlx4_ib_gid_entry *find_gid_entry(struct mlx4_ib_qp *qp, u8 *raw)
848{
849 struct mlx4_ib_gid_entry *ge;
850 struct mlx4_ib_gid_entry *tmp;
851 struct mlx4_ib_gid_entry *ret = NULL;
852
853 list_for_each_entry_safe(ge, tmp, &qp->gid_list, list) {
854 if (!memcmp(raw, ge->gid.raw, 16)) {
855 ret = ge;
856 break;
857 }
858 }
859
860 return ret;
225c7b1f
RD
861}
862
863static int mlx4_ib_mcg_detach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
864{
fa417f7b
EC
865 int err;
866 struct mlx4_ib_dev *mdev = to_mdev(ibqp->device);
867 struct mlx4_ib_qp *mqp = to_mqp(ibqp);
868 u8 mac[6];
869 struct net_device *ndev;
870 struct mlx4_ib_gid_entry *ge;
0ff1fb65
HHZ
871 u64 reg_id = 0;
872
873 if (mdev->dev->caps.steering_mode ==
874 MLX4_STEERING_MODE_DEVICE_MANAGED) {
875 struct mlx4_ib_steering *ib_steering;
876
877 mutex_lock(&mqp->mutex);
878 list_for_each_entry(ib_steering, &mqp->steering_rules, list) {
879 if (!memcmp(ib_steering->gid.raw, gid->raw, 16)) {
880 list_del(&ib_steering->list);
881 break;
882 }
883 }
884 mutex_unlock(&mqp->mutex);
885 if (&ib_steering->list == &mqp->steering_rules) {
886 pr_err("Couldn't find reg_id for mgid. Steering rule is left attached\n");
887 return -EINVAL;
888 }
889 reg_id = ib_steering->reg_id;
890 kfree(ib_steering);
891 }
fa417f7b 892
0ff1fb65
HHZ
893 err = mlx4_multicast_detach(mdev->dev, &mqp->mqp, gid->raw,
894 MLX4_PROT_IB_IPV6, reg_id);
fa417f7b
EC
895 if (err)
896 return err;
897
898 mutex_lock(&mqp->mutex);
899 ge = find_gid_entry(mqp, gid->raw);
900 if (ge) {
901 spin_lock(&mdev->iboe.lock);
902 ndev = ge->added ? mdev->iboe.netdevs[ge->port - 1] : NULL;
903 if (ndev)
904 dev_hold(ndev);
905 spin_unlock(&mdev->iboe.lock);
906 rdma_get_mcast_mac((struct in6_addr *)gid, mac);
907 if (ndev) {
908 rtnl_lock();
909 dev_mc_del(mdev->iboe.netdevs[ge->port - 1], mac);
910 rtnl_unlock();
911 dev_put(ndev);
912 }
913 list_del(&ge->list);
914 kfree(ge);
915 } else
987c8f8f 916 pr_warn("could not find mgid entry\n");
fa417f7b
EC
917
918 mutex_unlock(&mqp->mutex);
919
920 return 0;
225c7b1f
RD
921}
922
923static int init_node_data(struct mlx4_ib_dev *dev)
924{
925 struct ib_smp *in_mad = NULL;
926 struct ib_smp *out_mad = NULL;
0a9a0188 927 int mad_ifc_flags = MLX4_MAD_IFC_IGNORE_KEYS;
225c7b1f
RD
928 int err = -ENOMEM;
929
930 in_mad = kzalloc(sizeof *in_mad, GFP_KERNEL);
931 out_mad = kmalloc(sizeof *out_mad, GFP_KERNEL);
932 if (!in_mad || !out_mad)
933 goto out;
934
935 init_query_mad(in_mad);
936 in_mad->attr_id = IB_SMP_ATTR_NODE_DESC;
0a9a0188
JM
937 if (mlx4_is_master(dev->dev))
938 mad_ifc_flags |= MLX4_MAD_IFC_NET_VIEW;
225c7b1f 939
0a9a0188 940 err = mlx4_MAD_IFC(dev, mad_ifc_flags, 1, NULL, NULL, in_mad, out_mad);
225c7b1f
RD
941 if (err)
942 goto out;
943
944 memcpy(dev->ib_dev.node_desc, out_mad->data, 64);
945
946 in_mad->attr_id = IB_SMP_ATTR_NODE_INFO;
947
0a9a0188 948 err = mlx4_MAD_IFC(dev, mad_ifc_flags, 1, NULL, NULL, in_mad, out_mad);
225c7b1f
RD
949 if (err)
950 goto out;
951
992e8e6e 952 dev->dev->rev_id = be32_to_cpup((__be32 *) (out_mad->data + 32));
225c7b1f
RD
953 memcpy(&dev->ib_dev.node_guid, out_mad->data + 12, 8);
954
955out:
956 kfree(in_mad);
957 kfree(out_mad);
958 return err;
959}
960
f4e91eb4
TJ
961static ssize_t show_hca(struct device *device, struct device_attribute *attr,
962 char *buf)
cd9281d8 963{
f4e91eb4
TJ
964 struct mlx4_ib_dev *dev =
965 container_of(device, struct mlx4_ib_dev, ib_dev.dev);
cd9281d8
JM
966 return sprintf(buf, "MT%d\n", dev->dev->pdev->device);
967}
968
f4e91eb4
TJ
969static ssize_t show_fw_ver(struct device *device, struct device_attribute *attr,
970 char *buf)
cd9281d8 971{
f4e91eb4
TJ
972 struct mlx4_ib_dev *dev =
973 container_of(device, struct mlx4_ib_dev, ib_dev.dev);
cd9281d8
JM
974 return sprintf(buf, "%d.%d.%d\n", (int) (dev->dev->caps.fw_ver >> 32),
975 (int) (dev->dev->caps.fw_ver >> 16) & 0xffff,
976 (int) dev->dev->caps.fw_ver & 0xffff);
977}
978
f4e91eb4
TJ
979static ssize_t show_rev(struct device *device, struct device_attribute *attr,
980 char *buf)
cd9281d8 981{
f4e91eb4
TJ
982 struct mlx4_ib_dev *dev =
983 container_of(device, struct mlx4_ib_dev, ib_dev.dev);
cd9281d8
JM
984 return sprintf(buf, "%x\n", dev->dev->rev_id);
985}
986
f4e91eb4
TJ
987static ssize_t show_board(struct device *device, struct device_attribute *attr,
988 char *buf)
cd9281d8 989{
f4e91eb4
TJ
990 struct mlx4_ib_dev *dev =
991 container_of(device, struct mlx4_ib_dev, ib_dev.dev);
992 return sprintf(buf, "%.*s\n", MLX4_BOARD_ID_LEN,
993 dev->dev->board_id);
cd9281d8
JM
994}
995
f4e91eb4
TJ
996static DEVICE_ATTR(hw_rev, S_IRUGO, show_rev, NULL);
997static DEVICE_ATTR(fw_ver, S_IRUGO, show_fw_ver, NULL);
998static DEVICE_ATTR(hca_type, S_IRUGO, show_hca, NULL);
999static DEVICE_ATTR(board_id, S_IRUGO, show_board, NULL);
cd9281d8 1000
f4e91eb4
TJ
1001static struct device_attribute *mlx4_class_attributes[] = {
1002 &dev_attr_hw_rev,
1003 &dev_attr_fw_ver,
1004 &dev_attr_hca_type,
1005 &dev_attr_board_id
cd9281d8
JM
1006};
1007
4c3eb3ca 1008static void mlx4_addrconf_ifid_eui48(u8 *eui, u16 vlan_id, struct net_device *dev)
fa417f7b
EC
1009{
1010 memcpy(eui, dev->dev_addr, 3);
1011 memcpy(eui + 5, dev->dev_addr + 3, 3);
4c3eb3ca
EC
1012 if (vlan_id < 0x1000) {
1013 eui[3] = vlan_id >> 8;
1014 eui[4] = vlan_id & 0xff;
1015 } else {
1016 eui[3] = 0xff;
1017 eui[4] = 0xfe;
1018 }
fa417f7b
EC
1019 eui[0] ^= 2;
1020}
1021
1022static void update_gids_task(struct work_struct *work)
1023{
1024 struct update_gid_work *gw = container_of(work, struct update_gid_work, work);
1025 struct mlx4_cmd_mailbox *mailbox;
1026 union ib_gid *gids;
1027 int err;
1028 struct mlx4_dev *dev = gw->dev->dev;
fa417f7b
EC
1029
1030 mailbox = mlx4_alloc_cmd_mailbox(dev);
1031 if (IS_ERR(mailbox)) {
987c8f8f 1032 pr_warn("update gid table failed %ld\n", PTR_ERR(mailbox));
fa417f7b
EC
1033 return;
1034 }
1035
1036 gids = mailbox->buf;
1037 memcpy(gids, gw->gids, sizeof gw->gids);
1038
1039 err = mlx4_cmd(dev, mailbox->dma, MLX4_SET_PORT_GID_TABLE << 8 | gw->port,
f9baff50 1040 1, MLX4_CMD_SET_PORT, MLX4_CMD_TIME_CLASS_B,
992e8e6e 1041 MLX4_CMD_WRAPPED);
fa417f7b 1042 if (err)
987c8f8f 1043 pr_warn("set port command failed\n");
fa417f7b
EC
1044 else {
1045 memcpy(gw->dev->iboe.gid_table[gw->port - 1], gw->gids, sizeof gw->gids);
00f5ce99 1046 mlx4_ib_dispatch_event(gw->dev, gw->port, IB_EVENT_GID_CHANGE);
fa417f7b
EC
1047 }
1048
1049 mlx4_free_cmd_mailbox(dev, mailbox);
1050 kfree(gw);
1051}
1052
1053static int update_ipv6_gids(struct mlx4_ib_dev *dev, int port, int clear)
1054{
1055 struct net_device *ndev = dev->iboe.netdevs[port - 1];
1056 struct update_gid_work *work;
4c3eb3ca
EC
1057 struct net_device *tmp;
1058 int i;
1059 u8 *hits;
1060 int ret;
1061 union ib_gid gid;
1062 int free;
1063 int found;
1064 int need_update = 0;
1065 u16 vid;
fa417f7b
EC
1066
1067 work = kzalloc(sizeof *work, GFP_ATOMIC);
1068 if (!work)
1069 return -ENOMEM;
1070
4c3eb3ca
EC
1071 hits = kzalloc(128, GFP_ATOMIC);
1072 if (!hits) {
1073 ret = -ENOMEM;
1074 goto out;
1075 }
1076
22f4fbd9
ED
1077 rcu_read_lock();
1078 for_each_netdev_rcu(&init_net, tmp) {
4c3eb3ca
EC
1079 if (ndev && (tmp == ndev || rdma_vlan_dev_real_dev(tmp) == ndev)) {
1080 gid.global.subnet_prefix = cpu_to_be64(0xfe80000000000000LL);
1081 vid = rdma_vlan_dev_vlan_id(tmp);
1082 mlx4_addrconf_ifid_eui48(&gid.raw[8], vid, ndev);
1083 found = 0;
1084 free = -1;
1085 for (i = 0; i < 128; ++i) {
1086 if (free < 0 &&
1087 !memcmp(&dev->iboe.gid_table[port - 1][i], &zgid, sizeof zgid))
1088 free = i;
1089 if (!memcmp(&dev->iboe.gid_table[port - 1][i], &gid, sizeof gid)) {
1090 hits[i] = 1;
1091 found = 1;
1092 break;
1093 }
1094 }
1095
1096 if (!found) {
1097 if (tmp == ndev &&
1098 (memcmp(&dev->iboe.gid_table[port - 1][0],
1099 &gid, sizeof gid) ||
1100 !memcmp(&dev->iboe.gid_table[port - 1][0],
1101 &zgid, sizeof gid))) {
1102 dev->iboe.gid_table[port - 1][0] = gid;
1103 ++need_update;
1104 hits[0] = 1;
1105 } else if (free >= 0) {
1106 dev->iboe.gid_table[port - 1][free] = gid;
1107 hits[free] = 1;
1108 ++need_update;
1109 }
1110 }
1111 }
fa417f7b 1112 }
22f4fbd9 1113 rcu_read_unlock();
4c3eb3ca
EC
1114
1115 for (i = 0; i < 128; ++i)
1116 if (!hits[i]) {
1117 if (memcmp(&dev->iboe.gid_table[port - 1][i], &zgid, sizeof zgid))
1118 ++need_update;
1119 dev->iboe.gid_table[port - 1][i] = zgid;
1120 }
fa417f7b 1121
4c3eb3ca
EC
1122 if (need_update) {
1123 memcpy(work->gids, dev->iboe.gid_table[port - 1], sizeof work->gids);
1124 INIT_WORK(&work->work, update_gids_task);
1125 work->port = port;
1126 work->dev = dev;
1127 queue_work(wq, &work->work);
1128 } else
1129 kfree(work);
fa417f7b 1130
4c3eb3ca 1131 kfree(hits);
fa417f7b 1132 return 0;
4c3eb3ca
EC
1133
1134out:
1135 kfree(work);
1136 return ret;
fa417f7b
EC
1137}
1138
1139static void handle_en_event(struct mlx4_ib_dev *dev, int port, unsigned long event)
1140{
1141 switch (event) {
1142 case NETDEV_UP:
4c3eb3ca 1143 case NETDEV_CHANGEADDR:
fa417f7b
EC
1144 update_ipv6_gids(dev, port, 0);
1145 break;
1146
1147 case NETDEV_DOWN:
1148 update_ipv6_gids(dev, port, 1);
1149 dev->iboe.netdevs[port - 1] = NULL;
1150 }
1151}
1152
/* A net device appeared for @port: rebuild the port's GID table. */
static void netdev_added(struct mlx4_ib_dev *dev, int port)
{
	const int clear = 0;

	update_ipv6_gids(dev, port, clear);
}
1157
/* The net device of @port went away: rebuild the GID table with clear set. */
static void netdev_removed(struct mlx4_ib_dev *dev, int port)
{
	const int clear = 1;

	update_ipv6_gids(dev, port, clear);
}
1162
1163static int mlx4_ib_netdev_event(struct notifier_block *this, unsigned long event,
1164 void *ptr)
1165{
1166 struct net_device *dev = ptr;
1167 struct mlx4_ib_dev *ibdev;
1168 struct net_device *oldnd;
1169 struct mlx4_ib_iboe *iboe;
1170 int port;
1171
1172 if (!net_eq(dev_net(dev), &init_net))
1173 return NOTIFY_DONE;
1174
1175 ibdev = container_of(this, struct mlx4_ib_dev, iboe.nb);
1176 iboe = &ibdev->iboe;
1177
1178 spin_lock(&iboe->lock);
1179 mlx4_foreach_ib_transport_port(port, ibdev->dev) {
1180 oldnd = iboe->netdevs[port - 1];
1181 iboe->netdevs[port - 1] =
0345584e 1182 mlx4_get_protocol_dev(ibdev->dev, MLX4_PROT_ETH, port);
fa417f7b
EC
1183 if (oldnd != iboe->netdevs[port - 1]) {
1184 if (iboe->netdevs[port - 1])
1185 netdev_added(ibdev, port);
1186 else
1187 netdev_removed(ibdev, port);
1188 }
1189 }
1190
4c3eb3ca
EC
1191 if (dev == iboe->netdevs[0] ||
1192 (iboe->netdevs[0] && rdma_vlan_dev_real_dev(dev) == iboe->netdevs[0]))
fa417f7b 1193 handle_en_event(ibdev, 1, event);
4c3eb3ca
EC
1194 else if (dev == iboe->netdevs[1]
1195 || (iboe->netdevs[1] && rdma_vlan_dev_real_dev(dev) == iboe->netdevs[1]))
fa417f7b
EC
1196 handle_en_event(ibdev, 2, event);
1197
1198 spin_unlock(&iboe->lock);
1199
1200 return NOTIFY_DONE;
1201}
1202
54679e14
JM
1203static void init_pkeys(struct mlx4_ib_dev *ibdev)
1204{
1205 int port;
1206 int slave;
1207 int i;
1208
1209 if (mlx4_is_master(ibdev->dev)) {
1210 for (slave = 0; slave <= ibdev->dev->num_vfs; ++slave) {
1211 for (port = 1; port <= ibdev->dev->caps.num_ports; ++port) {
1212 for (i = 0;
1213 i < ibdev->dev->phys_caps.pkey_phys_table_len[port];
1214 ++i) {
1215 ibdev->pkeys.virt2phys_pkey[slave][port - 1][i] =
1216 /* master has the identity virt2phys pkey mapping */
1217 (slave == mlx4_master_func_num(ibdev->dev) || !i) ? i :
1218 ibdev->dev->phys_caps.pkey_phys_table_len[port] - 1;
1219 mlx4_sync_pkey_table(ibdev->dev, slave, port, i,
1220 ibdev->pkeys.virt2phys_pkey[slave][port - 1][i]);
1221 }
1222 }
1223 }
1224 /* initialize pkey cache */
1225 for (port = 1; port <= ibdev->dev->caps.num_ports; ++port) {
1226 for (i = 0;
1227 i < ibdev->dev->phys_caps.pkey_phys_table_len[port];
1228 ++i)
1229 ibdev->pkeys.phys_pkey_cache[port-1][i] =
1230 (i) ? 0 : 0xFFFF;
1231 }
1232 }
1233}
1234
e605b743
SP
1235static void mlx4_ib_alloc_eqs(struct mlx4_dev *dev, struct mlx4_ib_dev *ibdev)
1236{
1237 char name[32];
1238 int eq_per_port = 0;
1239 int added_eqs = 0;
1240 int total_eqs = 0;
1241 int i, j, eq;
1242
3aac6ff1
SP
1243 /* Legacy mode or comp_pool is not large enough */
1244 if (dev->caps.comp_pool == 0 ||
1245 dev->caps.num_ports > dev->caps.comp_pool)
e605b743
SP
1246 return;
1247
1248 eq_per_port = rounddown_pow_of_two(dev->caps.comp_pool/
1249 dev->caps.num_ports);
1250
1251 /* Init eq table */
1252 added_eqs = 0;
1253 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_IB)
1254 added_eqs += eq_per_port;
1255
1256 total_eqs = dev->caps.num_comp_vectors + added_eqs;
1257
1258 ibdev->eq_table = kzalloc(total_eqs * sizeof(int), GFP_KERNEL);
1259 if (!ibdev->eq_table)
1260 return;
1261
1262 ibdev->eq_added = added_eqs;
1263
1264 eq = 0;
1265 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_IB) {
1266 for (j = 0; j < eq_per_port; j++) {
1267 sprintf(name, "mlx4-ib-%d-%d@%s",
1268 i, j, dev->pdev->bus->name);
1269 /* Set IRQ for specific name (per ring) */
d9236c3f
AV
1270 if (mlx4_assign_eq(dev, name, NULL,
1271 &ibdev->eq_table[eq])) {
e605b743
SP
1272 /* Use legacy (same as mlx4_en driver) */
1273 pr_warn("Can't allocate EQ %d; reverting to legacy\n", eq);
1274 ibdev->eq_table[eq] =
1275 (eq % dev->caps.num_comp_vectors);
1276 }
1277 eq++;
1278 }
1279 }
1280
1281 /* Fill the reset of the vector with legacy EQ */
1282 for (i = 0, eq = added_eqs; i < dev->caps.num_comp_vectors; i++)
1283 ibdev->eq_table[eq++] = i;
1284
1285 /* Advertise the new number of EQs to clients */
1286 ibdev->ib_dev.num_comp_vectors = total_eqs;
1287}
1288
1289static void mlx4_ib_free_eqs(struct mlx4_dev *dev, struct mlx4_ib_dev *ibdev)
1290{
1291 int i;
3aac6ff1
SP
1292
1293 /* no additional eqs were added */
1294 if (!ibdev->eq_table)
1295 return;
e605b743
SP
1296
1297 /* Reset the advertised EQ number */
1298 ibdev->ib_dev.num_comp_vectors = dev->caps.num_comp_vectors;
1299
1300 /* Free only the added eqs */
1301 for (i = 0; i < ibdev->eq_added; i++) {
1302 /* Don't free legacy eqs if used */
1303 if (ibdev->eq_table[i] <= dev->caps.num_comp_vectors)
1304 continue;
1305 mlx4_release_eq(dev, ibdev->eq_table[i]);
1306 }
1307
e605b743 1308 kfree(ibdev->eq_table);
e605b743
SP
1309}
1310
225c7b1f
RD
1311static void *mlx4_ib_add(struct mlx4_dev *dev)
1312{
1313 struct mlx4_ib_dev *ibdev;
22e7ef9c 1314 int num_ports = 0;
035b1032 1315 int i, j;
fa417f7b
EC
1316 int err;
1317 struct mlx4_ib_iboe *iboe;
225c7b1f 1318
987c8f8f 1319 pr_info_once("%s", mlx4_ib_version);
68f3948d 1320
026149cb
JM
1321 mlx4_foreach_non_ib_transport_port(i, dev)
1322 num_ports++;
1323
1324 if (mlx4_is_mfunc(dev) && num_ports) {
1325 dev_err(&dev->pdev->dev, "RoCE is not supported over SRIOV as yet\n");
8e59d254
JM
1326 return NULL;
1327 }
1328
026149cb 1329 num_ports = 0;
fa417f7b 1330 mlx4_foreach_ib_transport_port(i, dev)
22e7ef9c
RD
1331 num_ports++;
1332
1333 /* No point in registering a device with no ports... */
1334 if (num_ports == 0)
1335 return NULL;
1336
225c7b1f
RD
1337 ibdev = (struct mlx4_ib_dev *) ib_alloc_device(sizeof *ibdev);
1338 if (!ibdev) {
1339 dev_err(&dev->pdev->dev, "Device struct alloc failed\n");
1340 return NULL;
1341 }
1342
fa417f7b
EC
1343 iboe = &ibdev->iboe;
1344
225c7b1f
RD
1345 if (mlx4_pd_alloc(dev, &ibdev->priv_pdn))
1346 goto err_dealloc;
1347
1348 if (mlx4_uar_alloc(dev, &ibdev->priv_uar))
1349 goto err_pd;
1350
4979d18f
RD
1351 ibdev->uar_map = ioremap((phys_addr_t) ibdev->priv_uar.pfn << PAGE_SHIFT,
1352 PAGE_SIZE);
225c7b1f
RD
1353 if (!ibdev->uar_map)
1354 goto err_uar;
26c6bc7b 1355 MLX4_INIT_DOORBELL_LOCK(&ibdev->uar_lock);
225c7b1f 1356
225c7b1f
RD
1357 ibdev->dev = dev;
1358
1359 strlcpy(ibdev->ib_dev.name, "mlx4_%d", IB_DEVICE_NAME_MAX);
1360 ibdev->ib_dev.owner = THIS_MODULE;
1361 ibdev->ib_dev.node_type = RDMA_NODE_IB_CA;
95d04f07 1362 ibdev->ib_dev.local_dma_lkey = dev->caps.reserved_lkey;
22e7ef9c 1363 ibdev->num_ports = num_ports;
7ff93f8b 1364 ibdev->ib_dev.phys_port_cnt = ibdev->num_ports;
b8dd786f 1365 ibdev->ib_dev.num_comp_vectors = dev->caps.num_comp_vectors;
225c7b1f
RD
1366 ibdev->ib_dev.dma_device = &dev->pdev->dev;
1367
08ff3235
OG
1368 if (dev->caps.userspace_caps)
1369 ibdev->ib_dev.uverbs_abi_ver = MLX4_IB_UVERBS_ABI_VERSION;
1370 else
1371 ibdev->ib_dev.uverbs_abi_ver = MLX4_IB_UVERBS_NO_DEV_CAPS_ABI_VERSION;
1372
225c7b1f
RD
1373 ibdev->ib_dev.uverbs_cmd_mask =
1374 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT) |
1375 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE) |
1376 (1ull << IB_USER_VERBS_CMD_QUERY_PORT) |
1377 (1ull << IB_USER_VERBS_CMD_ALLOC_PD) |
1378 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD) |
1379 (1ull << IB_USER_VERBS_CMD_REG_MR) |
1380 (1ull << IB_USER_VERBS_CMD_DEREG_MR) |
1381 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
1382 (1ull << IB_USER_VERBS_CMD_CREATE_CQ) |
bbf8eed1 1383 (1ull << IB_USER_VERBS_CMD_RESIZE_CQ) |
225c7b1f
RD
1384 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ) |
1385 (1ull << IB_USER_VERBS_CMD_CREATE_QP) |
1386 (1ull << IB_USER_VERBS_CMD_MODIFY_QP) |
6a775e2b 1387 (1ull << IB_USER_VERBS_CMD_QUERY_QP) |
225c7b1f
RD
1388 (1ull << IB_USER_VERBS_CMD_DESTROY_QP) |
1389 (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST) |
1390 (1ull << IB_USER_VERBS_CMD_DETACH_MCAST) |
1391 (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
1392 (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
65541cb7 1393 (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
18abd5ea 1394 (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ) |
42849b26
SH
1395 (1ull << IB_USER_VERBS_CMD_CREATE_XSRQ) |
1396 (1ull << IB_USER_VERBS_CMD_OPEN_QP);
225c7b1f
RD
1397
1398 ibdev->ib_dev.query_device = mlx4_ib_query_device;
1399 ibdev->ib_dev.query_port = mlx4_ib_query_port;
fa417f7b 1400 ibdev->ib_dev.get_link_layer = mlx4_ib_port_link_layer;
225c7b1f
RD
1401 ibdev->ib_dev.query_gid = mlx4_ib_query_gid;
1402 ibdev->ib_dev.query_pkey = mlx4_ib_query_pkey;
1403 ibdev->ib_dev.modify_device = mlx4_ib_modify_device;
1404 ibdev->ib_dev.modify_port = mlx4_ib_modify_port;
1405 ibdev->ib_dev.alloc_ucontext = mlx4_ib_alloc_ucontext;
1406 ibdev->ib_dev.dealloc_ucontext = mlx4_ib_dealloc_ucontext;
1407 ibdev->ib_dev.mmap = mlx4_ib_mmap;
1408 ibdev->ib_dev.alloc_pd = mlx4_ib_alloc_pd;
1409 ibdev->ib_dev.dealloc_pd = mlx4_ib_dealloc_pd;
1410 ibdev->ib_dev.create_ah = mlx4_ib_create_ah;
1411 ibdev->ib_dev.query_ah = mlx4_ib_query_ah;
1412 ibdev->ib_dev.destroy_ah = mlx4_ib_destroy_ah;
1413 ibdev->ib_dev.create_srq = mlx4_ib_create_srq;
1414 ibdev->ib_dev.modify_srq = mlx4_ib_modify_srq;
65541cb7 1415 ibdev->ib_dev.query_srq = mlx4_ib_query_srq;
225c7b1f
RD
1416 ibdev->ib_dev.destroy_srq = mlx4_ib_destroy_srq;
1417 ibdev->ib_dev.post_srq_recv = mlx4_ib_post_srq_recv;
1418 ibdev->ib_dev.create_qp = mlx4_ib_create_qp;
1419 ibdev->ib_dev.modify_qp = mlx4_ib_modify_qp;
6a775e2b 1420 ibdev->ib_dev.query_qp = mlx4_ib_query_qp;
225c7b1f
RD
1421 ibdev->ib_dev.destroy_qp = mlx4_ib_destroy_qp;
1422 ibdev->ib_dev.post_send = mlx4_ib_post_send;
1423 ibdev->ib_dev.post_recv = mlx4_ib_post_recv;
1424 ibdev->ib_dev.create_cq = mlx4_ib_create_cq;
3fdcb97f 1425 ibdev->ib_dev.modify_cq = mlx4_ib_modify_cq;
bbf8eed1 1426 ibdev->ib_dev.resize_cq = mlx4_ib_resize_cq;
225c7b1f
RD
1427 ibdev->ib_dev.destroy_cq = mlx4_ib_destroy_cq;
1428 ibdev->ib_dev.poll_cq = mlx4_ib_poll_cq;
1429 ibdev->ib_dev.req_notify_cq = mlx4_ib_arm_cq;
1430 ibdev->ib_dev.get_dma_mr = mlx4_ib_get_dma_mr;
1431 ibdev->ib_dev.reg_user_mr = mlx4_ib_reg_user_mr;
1432 ibdev->ib_dev.dereg_mr = mlx4_ib_dereg_mr;
95d04f07
RD
1433 ibdev->ib_dev.alloc_fast_reg_mr = mlx4_ib_alloc_fast_reg_mr;
1434 ibdev->ib_dev.alloc_fast_reg_page_list = mlx4_ib_alloc_fast_reg_page_list;
1435 ibdev->ib_dev.free_fast_reg_page_list = mlx4_ib_free_fast_reg_page_list;
225c7b1f
RD
1436 ibdev->ib_dev.attach_mcast = mlx4_ib_mcg_attach;
1437 ibdev->ib_dev.detach_mcast = mlx4_ib_mcg_detach;
1438 ibdev->ib_dev.process_mad = mlx4_ib_process_mad;
1439
992e8e6e
JM
1440 if (!mlx4_is_slave(ibdev->dev)) {
1441 ibdev->ib_dev.alloc_fmr = mlx4_ib_fmr_alloc;
1442 ibdev->ib_dev.map_phys_fmr = mlx4_ib_map_phys_fmr;
1443 ibdev->ib_dev.unmap_fmr = mlx4_ib_unmap_fmr;
1444 ibdev->ib_dev.dealloc_fmr = mlx4_ib_fmr_dealloc;
1445 }
8ad11fb6 1446
b425388d
SM
1447 if (dev->caps.flags & MLX4_DEV_CAP_FLAG_MEM_WINDOW ||
1448 dev->caps.bmme_flags & MLX4_BMME_FLAG_TYPE_2_WIN) {
1449 ibdev->ib_dev.alloc_mw = mlx4_ib_alloc_mw;
1450 ibdev->ib_dev.bind_mw = mlx4_ib_bind_mw;
1451 ibdev->ib_dev.dealloc_mw = mlx4_ib_dealloc_mw;
1452
1453 ibdev->ib_dev.uverbs_cmd_mask |=
1454 (1ull << IB_USER_VERBS_CMD_ALLOC_MW) |
1455 (1ull << IB_USER_VERBS_CMD_DEALLOC_MW);
1456 }
1457
012a8ff5
SH
1458 if (dev->caps.flags & MLX4_DEV_CAP_FLAG_XRC) {
1459 ibdev->ib_dev.alloc_xrcd = mlx4_ib_alloc_xrcd;
1460 ibdev->ib_dev.dealloc_xrcd = mlx4_ib_dealloc_xrcd;
1461 ibdev->ib_dev.uverbs_cmd_mask |=
1462 (1ull << IB_USER_VERBS_CMD_OPEN_XRCD) |
1463 (1ull << IB_USER_VERBS_CMD_CLOSE_XRCD);
1464 }
1465
e605b743
SP
1466 mlx4_ib_alloc_eqs(dev, ibdev);
1467
fa417f7b
EC
1468 spin_lock_init(&iboe->lock);
1469
225c7b1f
RD
1470 if (init_node_data(ibdev))
1471 goto err_map;
1472
cfcde11c
OG
1473 for (i = 0; i < ibdev->num_ports; ++i) {
1474 if (mlx4_ib_port_link_layer(&ibdev->ib_dev, i + 1) ==
1475 IB_LINK_LAYER_ETHERNET) {
1476 err = mlx4_counter_alloc(ibdev->dev, &ibdev->counters[i]);
1477 if (err)
1478 ibdev->counters[i] = -1;
1479 } else
1480 ibdev->counters[i] = -1;
1481 }
1482
225c7b1f
RD
1483 spin_lock_init(&ibdev->sm_lock);
1484 mutex_init(&ibdev->cap_mask_mutex);
1485
9a6edb60 1486 if (ib_register_device(&ibdev->ib_dev, NULL))
cfcde11c 1487 goto err_counter;
225c7b1f
RD
1488
1489 if (mlx4_ib_mad_init(ibdev))
1490 goto err_reg;
1491
fc06573d
JM
1492 if (mlx4_ib_init_sriov(ibdev))
1493 goto err_mad;
1494
fa417f7b
EC
1495 if (dev->caps.flags & MLX4_DEV_CAP_FLAG_IBOE && !iboe->nb.notifier_call) {
1496 iboe->nb.notifier_call = mlx4_ib_netdev_event;
1497 err = register_netdevice_notifier(&iboe->nb);
1498 if (err)
fc06573d 1499 goto err_sriov;
fa417f7b
EC
1500 }
1501
035b1032 1502 for (j = 0; j < ARRAY_SIZE(mlx4_class_attributes); ++j) {
f4e91eb4 1503 if (device_create_file(&ibdev->ib_dev.dev,
035b1032 1504 mlx4_class_attributes[j]))
fa417f7b 1505 goto err_notif;
cd9281d8
JM
1506 }
1507
3b4a8cd5
JM
1508 ibdev->ib_active = true;
1509
54679e14
JM
1510 if (mlx4_is_mfunc(ibdev->dev))
1511 init_pkeys(ibdev);
1512
3806d08c
JM
1513 /* create paravirt contexts for any VFs which are active */
1514 if (mlx4_is_master(ibdev->dev)) {
1515 for (j = 0; j < MLX4_MFUNC_MAX; j++) {
1516 if (j == mlx4_master_func_num(ibdev->dev))
1517 continue;
1518 if (mlx4_is_slave_active(ibdev->dev, j))
1519 do_slave_init(ibdev, j, 1);
1520 }
1521 }
225c7b1f
RD
1522 return ibdev;
1523
fa417f7b
EC
1524err_notif:
1525 if (unregister_netdevice_notifier(&ibdev->iboe.nb))
987c8f8f 1526 pr_warn("failure unregistering notifier\n");
fa417f7b
EC
1527 flush_workqueue(wq);
1528
fc06573d
JM
1529err_sriov:
1530 mlx4_ib_close_sriov(ibdev);
1531
1532err_mad:
1533 mlx4_ib_mad_cleanup(ibdev);
1534
225c7b1f
RD
1535err_reg:
1536 ib_unregister_device(&ibdev->ib_dev);
1537
cfcde11c
OG
1538err_counter:
1539 for (; i; --i)
4af3ce0d
RD
1540 if (ibdev->counters[i - 1] != -1)
1541 mlx4_counter_free(ibdev->dev, ibdev->counters[i - 1]);
cfcde11c 1542
225c7b1f
RD
1543err_map:
1544 iounmap(ibdev->uar_map);
1545
1546err_uar:
1547 mlx4_uar_free(dev, &ibdev->priv_uar);
1548
1549err_pd:
1550 mlx4_pd_free(dev, ibdev->priv_pdn);
1551
1552err_dealloc:
1553 ib_dealloc_device(&ibdev->ib_dev);
1554
1555 return NULL;
1556}
1557
1558static void mlx4_ib_remove(struct mlx4_dev *dev, void *ibdev_ptr)
1559{
1560 struct mlx4_ib_dev *ibdev = ibdev_ptr;
1561 int p;
1562
fc06573d 1563 mlx4_ib_close_sriov(ibdev);
a6a47771
YP
1564 mlx4_ib_mad_cleanup(ibdev);
1565 ib_unregister_device(&ibdev->ib_dev);
fa417f7b
EC
1566 if (ibdev->iboe.nb.notifier_call) {
1567 if (unregister_netdevice_notifier(&ibdev->iboe.nb))
987c8f8f 1568 pr_warn("failure unregistering notifier\n");
fa417f7b
EC
1569 ibdev->iboe.nb.notifier_call = NULL;
1570 }
1571 iounmap(ibdev->uar_map);
cfcde11c 1572 for (p = 0; p < ibdev->num_ports; ++p)
4af3ce0d
RD
1573 if (ibdev->counters[p] != -1)
1574 mlx4_counter_free(ibdev->dev, ibdev->counters[p]);
fa417f7b 1575 mlx4_foreach_port(p, dev, MLX4_PORT_TYPE_IB)
225c7b1f
RD
1576 mlx4_CLOSE_PORT(dev, p);
1577
e605b743
SP
1578 mlx4_ib_free_eqs(dev, ibdev);
1579
225c7b1f
RD
1580 mlx4_uar_free(dev, &ibdev->priv_uar);
1581 mlx4_pd_free(dev, ibdev->priv_pdn);
1582 ib_dealloc_device(&ibdev->ib_dev);
1583}
1584
fc06573d
JM
1585static void do_slave_init(struct mlx4_ib_dev *ibdev, int slave, int do_init)
1586{
1587 struct mlx4_ib_demux_work **dm = NULL;
1588 struct mlx4_dev *dev = ibdev->dev;
1589 int i;
1590 unsigned long flags;
1591
1592 if (!mlx4_is_master(dev))
1593 return;
1594
1595 dm = kcalloc(dev->caps.num_ports, sizeof *dm, GFP_ATOMIC);
1596 if (!dm) {
1597 pr_err("failed to allocate memory for tunneling qp update\n");
1598 goto out;
1599 }
1600
1601 for (i = 0; i < dev->caps.num_ports; i++) {
1602 dm[i] = kmalloc(sizeof (struct mlx4_ib_demux_work), GFP_ATOMIC);
1603 if (!dm[i]) {
1604 pr_err("failed to allocate memory for tunneling qp update work struct\n");
1605 for (i = 0; i < dev->caps.num_ports; i++) {
1606 if (dm[i])
1607 kfree(dm[i]);
1608 }
1609 goto out;
1610 }
1611 }
1612 /* initialize or tear down tunnel QPs for the slave */
1613 for (i = 0; i < dev->caps.num_ports; i++) {
1614 INIT_WORK(&dm[i]->work, mlx4_ib_tunnels_update_work);
1615 dm[i]->port = i + 1;
1616 dm[i]->slave = slave;
1617 dm[i]->do_init = do_init;
1618 dm[i]->dev = ibdev;
1619 spin_lock_irqsave(&ibdev->sriov.going_down_lock, flags);
1620 if (!ibdev->sriov.is_going_down)
1621 queue_work(ibdev->sriov.demux[i].ud_wq, &dm[i]->work);
1622 spin_unlock_irqrestore(&ibdev->sriov.going_down_lock, flags);
1623 }
1624out:
c89d1271 1625 kfree(dm);
fc06573d
JM
1626 return;
1627}
1628
225c7b1f 1629static void mlx4_ib_event(struct mlx4_dev *dev, void *ibdev_ptr,
00f5ce99 1630 enum mlx4_dev_event event, unsigned long param)
225c7b1f
RD
1631{
1632 struct ib_event ibev;
7ff93f8b 1633 struct mlx4_ib_dev *ibdev = to_mdev((struct ib_device *) ibdev_ptr);
00f5ce99
JM
1634 struct mlx4_eqe *eqe = NULL;
1635 struct ib_event_work *ew;
fc06573d 1636 int p = 0;
00f5ce99
JM
1637
1638 if (event == MLX4_DEV_EVENT_PORT_MGMT_CHANGE)
1639 eqe = (struct mlx4_eqe *)param;
1640 else
fc06573d 1641 p = (int) param;
225c7b1f
RD
1642
1643 switch (event) {
37608eea 1644 case MLX4_DEV_EVENT_PORT_UP:
fc06573d
JM
1645 if (p > ibdev->num_ports)
1646 return;
a0c64a17
JM
1647 if (mlx4_is_master(dev) &&
1648 rdma_port_get_link_layer(&ibdev->ib_dev, p) ==
1649 IB_LINK_LAYER_INFINIBAND) {
1650 mlx4_ib_invalidate_all_guid_record(ibdev, p);
1651 }
37608eea 1652 ibev.event = IB_EVENT_PORT_ACTIVE;
225c7b1f
RD
1653 break;
1654
37608eea 1655 case MLX4_DEV_EVENT_PORT_DOWN:
fc06573d
JM
1656 if (p > ibdev->num_ports)
1657 return;
37608eea
RD
1658 ibev.event = IB_EVENT_PORT_ERR;
1659 break;
1660
1661 case MLX4_DEV_EVENT_CATASTROPHIC_ERROR:
3b4a8cd5 1662 ibdev->ib_active = false;
225c7b1f
RD
1663 ibev.event = IB_EVENT_DEVICE_FATAL;
1664 break;
1665
00f5ce99
JM
1666 case MLX4_DEV_EVENT_PORT_MGMT_CHANGE:
1667 ew = kmalloc(sizeof *ew, GFP_ATOMIC);
1668 if (!ew) {
1669 pr_err("failed to allocate memory for events work\n");
1670 break;
1671 }
1672
1673 INIT_WORK(&ew->work, handle_port_mgmt_change_event);
1674 memcpy(&ew->ib_eqe, eqe, sizeof *eqe);
1675 ew->ib_dev = ibdev;
992e8e6e
JM
1676 /* need to queue only for port owner, which uses GEN_EQE */
1677 if (mlx4_is_master(dev))
1678 queue_work(wq, &ew->work);
1679 else
1680 handle_port_mgmt_change_event(&ew->work);
00f5ce99
JM
1681 return;
1682
fc06573d
JM
1683 case MLX4_DEV_EVENT_SLAVE_INIT:
1684 /* here, p is the slave id */
1685 do_slave_init(ibdev, p, 1);
1686 return;
1687
1688 case MLX4_DEV_EVENT_SLAVE_SHUTDOWN:
1689 /* here, p is the slave id */
1690 do_slave_init(ibdev, p, 0);
1691 return;
1692
225c7b1f
RD
1693 default:
1694 return;
1695 }
1696
1697 ibev.device = ibdev_ptr;
fc06573d 1698 ibev.element.port_num = (u8) p;
225c7b1f
RD
1699
1700 ib_dispatch_event(&ibev);
1701}
1702
1703static struct mlx4_interface mlx4_ib_interface = {
fa417f7b
EC
1704 .add = mlx4_ib_add,
1705 .remove = mlx4_ib_remove,
1706 .event = mlx4_ib_event,
0345584e 1707 .protocol = MLX4_PROT_IB_IPV6
225c7b1f
RD
1708};
1709
1710static int __init mlx4_ib_init(void)
1711{
fa417f7b
EC
1712 int err;
1713
1714 wq = create_singlethread_workqueue("mlx4_ib");
1715 if (!wq)
1716 return -ENOMEM;
1717
b9c5d6a6
OD
1718 err = mlx4_ib_mcg_init();
1719 if (err)
1720 goto clean_wq;
1721
fa417f7b 1722 err = mlx4_register_interface(&mlx4_ib_interface);
b9c5d6a6
OD
1723 if (err)
1724 goto clean_mcg;
fa417f7b
EC
1725
1726 return 0;
b9c5d6a6
OD
1727
1728clean_mcg:
1729 mlx4_ib_mcg_destroy();
1730
1731clean_wq:
1732 destroy_workqueue(wq);
1733 return err;
225c7b1f
RD
1734}
1735
1736static void __exit mlx4_ib_cleanup(void)
1737{
1738 mlx4_unregister_interface(&mlx4_ib_interface);
b9c5d6a6 1739 mlx4_ib_mcg_destroy();
fa417f7b 1740 destroy_workqueue(wq);
225c7b1f
RD
1741}
1742
/* Hook the init and cleanup routines into module load and unload. */
module_init(mlx4_ib_init);
module_exit(mlx4_ib_cleanup);