2 * Copyright (c) 2007 Mellanox Technologies. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34 #include <linux/etherdevice.h>
35 #include <linux/tcp.h>
36 #include <linux/if_vlan.h>
37 #include <linux/delay.h>
38 #include <linux/slab.h>
40 #include <linux/mlx4/driver.h>
41 #include <linux/mlx4/device.h>
42 #include <linux/mlx4/cmd.h>
43 #include <linux/mlx4/cq.h>
/*
 * mlx4_en_vlan_rx_register - VLAN group registration hook (installed as
 * .ndo_vlan_rx_register in mlx4_netdev_ops).
 *
 * Logs the group pointer, then takes mdev->state_lock and, only when both
 * the device and the port are up, programs the port VLAN filter from @grp
 * with mlx4_SET_VLAN_FLTR().  The en_err() that follows presumably reports
 * a failed call.
 *
 * NOTE(review): this listing has lost lines during extraction (braces, the
 * `err` declaration and its check, possibly more) - confirm against the
 * pristine file.
 */
49 static void mlx4_en_vlan_rx_register(struct net_device
*dev
, struct vlan_group
*grp
)
51 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
52 struct mlx4_en_dev
*mdev
= priv
->mdev
;
55 en_dbg(HW
, priv
, "Registering VLAN group:%p\n", grp
);
58 mutex_lock(&mdev
->state_lock
);
59 if (mdev
->device_up
&& priv
->port_up
) {
60 err
= mlx4_SET_VLAN_FLTR(mdev
->dev
, priv
->port
, grp
);
62 en_err(priv
, "Failed configuring VLAN filter\n");
64 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_vlan_rx_add_vid - hook called when VLAN id @vid is added
 * (installed as .ndo_vlan_rx_add_vid in mlx4_netdev_ops).
 *
 * Logs the VID and its current vlgrp entry, then, under mdev->state_lock
 * and only when device and port are up, re-programs the port VLAN filter
 * from priv->vlgrp with mlx4_SET_VLAN_FLTR().
 *
 * NOTE(review): lines are missing from this listing (braces, `err`
 * declaration/check) - confirm against the pristine file.
 */
67 static void mlx4_en_vlan_rx_add_vid(struct net_device
*dev
, unsigned short vid
)
69 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
70 struct mlx4_en_dev
*mdev
= priv
->mdev
;
76 en_dbg(HW
, priv
, "adding VLAN:%d (vlgrp entry:%p)\n",
77 vid
, vlan_group_get_device(priv
->vlgrp
, vid
));
79 /* Add VID to port VLAN filter */
80 mutex_lock(&mdev
->state_lock
);
81 if (mdev
->device_up
&& priv
->port_up
) {
82 err
= mlx4_SET_VLAN_FLTR(mdev
->dev
, priv
->port
, priv
->vlgrp
);
84 en_err(priv
, "Failed configuring VLAN filter\n");
86 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_vlan_rx_kill_vid - hook called when VLAN id @vid is removed
 * (installed as .ndo_vlan_rx_kill_vid in mlx4_netdev_ops).
 *
 * Logs the VID, clears its slot in priv->vlgrp with
 * vlan_group_set_device(..., NULL), then, under mdev->state_lock and only
 * when device and port are up, re-programs the port VLAN filter from the
 * updated priv->vlgrp.
 *
 * NOTE(review): lines are missing from this listing (braces, `err`
 * declaration/check) - confirm against the pristine file.
 */
89 static void mlx4_en_vlan_rx_kill_vid(struct net_device
*dev
, unsigned short vid
)
91 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
92 struct mlx4_en_dev
*mdev
= priv
->mdev
;
98 en_dbg(HW
, priv
, "Killing VID:%d (vlgrp:%p vlgrp entry:%p)\n",
99 vid
, priv
->vlgrp
, vlan_group_get_device(priv
->vlgrp
, vid
));
100 vlan_group_set_device(priv
->vlgrp
, vid
, NULL
);
102 /* Remove VID from port VLAN filter */
103 mutex_lock(&mdev
->state_lock
);
104 if (mdev
->device_up
&& priv
->port_up
) {
105 err
= mlx4_SET_VLAN_FLTR(mdev
->dev
, priv
->port
, priv
->vlgrp
);
107 en_err(priv
, "Failed configuring VLAN filter\n");
109 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_mac_to_u64 - convert the MAC address bytes at @addr to a u64.
 *
 * Only the loop header over ETH_ALEN bytes is visible in this listing; the
 * loop body, the accumulator and the return statement are missing.
 * Callers in this file store the result in priv->mac and pass it to
 * mlx4_SET_MCAST_FLTR(), so it presumably packs the bytes into one
 * integer - TODO confirm byte order against the pristine file.
 */
112 u64
mlx4_en_mac_to_u64(u8
*addr
)
117 for (i
= 0; i
< ETH_ALEN
; i
++) {
/*
 * mlx4_en_set_mac - change the interface MAC address (installed as
 * .ndo_set_mac_address in mlx4_netdev_ops).
 *
 * @addr is treated as a struct sockaddr.  An address rejected by
 * is_valid_ether_addr() yields -EADDRNOTAVAIL.  Otherwise the address is
 * copied into dev->dev_addr, cached as a u64 in priv->mac, and the
 * hardware update is deferred to priv->mac_task on the driver workqueue.
 *
 * NOTE(review): the success return is not visible in this listing.
 */
124 static int mlx4_en_set_mac(struct net_device
*dev
, void *addr
)
126 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
127 struct mlx4_en_dev
*mdev
= priv
->mdev
;
128 struct sockaddr
*saddr
= addr
;
130 if (!is_valid_ether_addr(saddr
->sa_data
))
131 return -EADDRNOTAVAIL
;
133 memcpy(dev
->dev_addr
, saddr
->sa_data
, ETH_ALEN
);
134 priv
->mac
= mlx4_en_mac_to_u64(dev
->dev_addr
);
135 queue_work(mdev
->workqueue
, &priv
->mac_task
);
/*
 * mlx4_en_do_set_mac - work handler that applies priv->mac to the hardware
 * (registered for priv->mac_task via INIT_WORK in mlx4_en_init_netdev).
 *
 * Under mdev->state_lock it unregisters the MAC at priv->mac_index and
 * registers priv->mac, storing the new index back in priv->mac_index.
 *
 * NOTE(review): the condition selecting between the register path and the
 * "Port is down" debug message, and the `err` check before en_err(), are
 * missing from this listing - confirm against the pristine file.
 */
139 static void mlx4_en_do_set_mac(struct work_struct
*work
)
141 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
143 struct mlx4_en_dev
*mdev
= priv
->mdev
;
146 mutex_lock(&mdev
->state_lock
);
148 /* Remove old MAC and insert the new one */
149 mlx4_unregister_mac(mdev
->dev
, priv
->port
, priv
->mac_index
);
150 err
= mlx4_register_mac(mdev
->dev
, priv
->port
,
151 priv
->mac
, &priv
->mac_index
);
153 en_err(priv
, "Failed changing HW MAC address\n");
155 en_dbg(HW
, priv
, "Port is down while "
156 "registering mac, exiting...\n");
158 mutex_unlock(&mdev
->state_lock
);
161 static void mlx4_en_clear_list(struct net_device
*dev
)
163 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
165 kfree(priv
->mc_addrs
);
166 priv
->mc_addrs_cnt
= 0;
/*
 * mlx4_en_cache_mclist - snapshot the device multicast list.
 *
 * Allocates netdev_mc_count(dev) * ETH_ALEN bytes with GFP_ATOMIC, copies
 * each address from netdev_for_each_mc_addr() into consecutive ETH_ALEN
 * slots, and publishes the buffer and count in priv->mc_addrs and
 * priv->mc_addrs_cnt.  The caller in this file invokes it between
 * netif_tx_lock_bh() and netif_tx_unlock_bh().
 *
 * NOTE(review): the allocation-failure check/return, the `mc_addrs` and
 * `i` declarations and the initialisation of `i` are missing from this
 * listing.  On the failure path priv->mc_addrs appears to be left as it
 * was - confirm that callers cope with a stale value.
 */
169 static void mlx4_en_cache_mclist(struct net_device
*dev
)
171 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
172 struct netdev_hw_addr
*ha
;
174 int mc_addrs_cnt
= netdev_mc_count(dev
);
177 mc_addrs
= kmalloc(mc_addrs_cnt
* ETH_ALEN
, GFP_ATOMIC
);
179 en_err(priv
, "failed to allocate multicast list\n");
183 netdev_for_each_mc_addr(ha
, dev
)
184 memcpy(mc_addrs
+ i
++ * ETH_ALEN
, ha
->addr
, ETH_ALEN
);
185 priv
->mc_addrs
= mc_addrs
;
186 priv
->mc_addrs_cnt
= mc_addrs_cnt
;
/*
 * mlx4_en_set_multicast - RX-mode change hook (installed as
 * .ndo_set_multicast_list in mlx4_netdev_ops).
 *
 * Does no hardware work itself; it queues priv->mcast_task on the driver
 * workqueue so mlx4_en_do_set_multicast() runs later.
 *
 * NOTE(review): lines between the priv lookup and queue_work() are missing
 * from this listing - there may be an early-exit check.
 */
190 static void mlx4_en_set_multicast(struct net_device
*dev
)
192 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
197 queue_work(priv
->mdev
->workqueue
, &priv
->mcast_task
);
/*
 * mlx4_en_do_set_multicast - work handler that syncs promiscuous,
 * all-multicast and multicast-list state to the port (registered for
 * priv->mcast_task via INIT_WORK in mlx4_en_init_netdev).
 *
 * Runs under mdev->state_lock.  Visible flow:
 *  - device down or port down: log and ignore the change;
 *  - IFF_PROMISC set: on first entry set MLX4_EN_FLAG_PROMISC and issue
 *    mlx4_SET_PORT_qpn_calc(), then disable the multicast filter and
 *    disable the VLAN filter (NULL group);
 *  - otherwise: if the promisc flag was set, clear it, issue
 *    mlx4_SET_PORT_qpn_calc() and re-enable the VLAN filter from
 *    priv->vlgrp;
 *  - IFF_ALLMULTI: disable the multicast filter;
 *  - else: disable the filter, flush it and seed it with ETH_BCAST, cache
 *    the multicast list under netif_tx_lock_bh(), add every cached
 *    address, enable the filter, and free the cache.
 *
 * NOTE(review): many lines are missing from this listing (braces, `err`
 * checks, gotos/labels, trailing call arguments, comment delimiters) -
 * confirm branch structure against the pristine file.
 */
200 static void mlx4_en_do_set_multicast(struct work_struct
*work
)
202 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
204 struct mlx4_en_dev
*mdev
= priv
->mdev
;
205 struct net_device
*dev
= priv
->dev
;
209 mutex_lock(&mdev
->state_lock
);
210 if (!mdev
->device_up
) {
211 en_dbg(HW
, priv
, "Card is not up, "
212 "ignoring multicast change.\n");
215 if (!priv
->port_up
) {
216 en_dbg(HW
, priv
, "Port is down, "
217 "ignoring multicast change.\n");
222 * Promsicuous mode: disable all filters
225 if (dev
->flags
& IFF_PROMISC
) {
226 if (!(priv
->flags
& MLX4_EN_FLAG_PROMISC
)) {
227 if (netif_msg_rx_status(priv
))
228 en_warn(priv
, "Entering promiscuous mode\n");
229 priv
->flags
|= MLX4_EN_FLAG_PROMISC
;
231 /* Enable promiscuous mode */
232 err
= mlx4_SET_PORT_qpn_calc(mdev
->dev
, priv
->port
,
235 en_err(priv
, "Failed enabling "
236 "promiscous mode\n");
238 /* Disable port multicast filter (unconditionally) */
239 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
240 0, MLX4_MCAST_DISABLE
);
242 en_err(priv
, "Failed disabling "
243 "multicast filter\n");
245 /* Disable port VLAN filter */
246 err
= mlx4_SET_VLAN_FLTR(mdev
->dev
, priv
->port
, NULL
);
248 en_err(priv
, "Failed disabling VLAN filter\n");
254 * Not in promiscous mode
257 if (priv
->flags
& MLX4_EN_FLAG_PROMISC
) {
258 if (netif_msg_rx_status(priv
))
259 en_warn(priv
, "Leaving promiscuous mode\n");
260 priv
->flags
&= ~MLX4_EN_FLAG_PROMISC
;
262 /* Disable promiscuous mode */
263 err
= mlx4_SET_PORT_qpn_calc(mdev
->dev
, priv
->port
,
266 en_err(priv
, "Failed disabling promiscous mode\n");
268 /* Enable port VLAN filter */
269 err
= mlx4_SET_VLAN_FLTR(mdev
->dev
, priv
->port
, priv
->vlgrp
);
271 en_err(priv
, "Failed enabling VLAN filter\n");
274 /* Enable/disable the multicast filter according to IFF_ALLMULTI */
275 if (dev
->flags
& IFF_ALLMULTI
) {
276 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
277 0, MLX4_MCAST_DISABLE
);
279 en_err(priv
, "Failed disabling multicast filter\n");
283 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
284 0, MLX4_MCAST_DISABLE
);
286 en_err(priv
, "Failed disabling multicast filter\n");
288 /* Flush mcast filter and init it with broadcast address */
289 mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, ETH_BCAST
,
290 1, MLX4_MCAST_CONFIG
);
292 /* Update multicast list - we cache all addresses so they won't
293 * change while HW is updated holding the command semaphore */
294 netif_tx_lock_bh(dev
);
295 mlx4_en_cache_mclist(dev
);
296 netif_tx_unlock_bh(dev
);
297 for (i
= 0; i
< priv
->mc_addrs_cnt
; i
++) {
299 mlx4_en_mac_to_u64(priv
->mc_addrs
+ i
* ETH_ALEN
);
300 mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
,
301 mcast_addr
, 0, MLX4_MCAST_CONFIG
);
303 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
304 0, MLX4_MCAST_ENABLE
);
306 en_err(priv
, "Failed enabling multicast filter\n");
308 mlx4_en_clear_list(dev
);
311 mutex_unlock(&mdev
->state_lock
);
314 #ifdef CONFIG_NET_POLL_CONTROLLER
/*
 * mlx4_en_netpoll - poll-controller hook (installed as
 * .ndo_poll_controller when CONFIG_NET_POLL_CONTROLLER is set).
 *
 * For every RX completion queue: take cq->lock with IRQs saved, call
 * napi_synchronize() on the CQ's NAPI context, process the RX CQ with a
 * budget argument of 0, and release the lock.
 *
 * NOTE(review): napi_synchronize() is called with a spinlock held and
 * interrupts disabled - confirm it cannot sleep in this context.
 * NOTE(review): the `flags`/`i` declarations, braces and the closing
 * #endif are missing from this listing.
 */
315 static void mlx4_en_netpoll(struct net_device
*dev
)
317 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
318 struct mlx4_en_cq
*cq
;
322 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
323 cq
= &priv
->rx_cq
[i
];
324 spin_lock_irqsave(&cq
->lock
, flags
);
325 napi_synchronize(&cq
->napi
);
326 mlx4_en_process_rx_cq(dev
, cq
, 0);
327 spin_unlock_irqrestore(&cq
->lock
, flags
);
/*
 * mlx4_en_tx_timeout - TX watchdog hook (installed as .ndo_tx_timeout in
 * mlx4_netdev_ops).
 *
 * Optionally warns (gated by netif_msg_timer()), bumps
 * priv->port_stats.tx_timeout, and queues priv->watchdog_task, whose
 * handler (mlx4_en_restart) stops and restarts the port.
 */
332 static void mlx4_en_tx_timeout(struct net_device
*dev
)
334 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
335 struct mlx4_en_dev
*mdev
= priv
->mdev
;
337 if (netif_msg_timer(priv
))
338 en_warn(priv
, "Tx timeout called on port:%d\n", priv
->port
);
340 priv
->port_stats
.tx_timeout
++;
341 en_dbg(DRV
, priv
, "Scheduling watchdog\n");
342 queue_work(mdev
->workqueue
, &priv
->watchdog_task
);
/*
 * mlx4_en_get_stats - statistics hook (installed as .ndo_get_stats in
 * mlx4_netdev_ops).
 *
 * Copies priv->stats into priv->ret_stats while holding priv->stats_lock
 * (BH-disabled) and returns a pointer to the copy, so the caller reads a
 * snapshot taken under the lock rather than the live counters.
 */
346 static struct net_device_stats
*mlx4_en_get_stats(struct net_device
*dev
)
348 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
350 spin_lock_bh(&priv
->stats_lock
);
351 memcpy(&priv
->ret_stats
, &priv
->stats
, sizeof(priv
->stats
));
352 spin_unlock_bh(&priv
->stats_lock
);
354 return &priv
->ret_stats
;
/*
 * mlx4_en_set_default_moderation - load default interrupt-coalescing
 * settings into @priv and its completion queues.
 *
 * Sets priv->rx_frames / priv->rx_usecs from the MLX4_EN_RX_COAL_*
 * defaults, copies them into every RX CQ (moder_cnt / moder_time), gives
 * every TX CQ the MLX4_EN_TX_COAL_* defaults, then resets the adaptive
 * moderation state: rate thresholds, low/high usecs, sample interval,
 * adaptive_rx_coal = 1, and the last_moder_* history.
 *
 * Only software state is written here; no hardware call is visible.
 *
 * NOTE(review): the `i` declaration, braces and a comment terminator are
 * missing from this listing.
 */
357 static void mlx4_en_set_default_moderation(struct mlx4_en_priv
*priv
)
359 struct mlx4_en_cq
*cq
;
362 /* If we haven't received a specific coalescing setting
363 * (module param), we set the moderation parameters as follows:
364 * - moder_cnt is set to the number of mtu sized packets to
365 * satisfy our coelsing target.
366 * - moder_time is set to a fixed value.
368 priv
->rx_frames
= MLX4_EN_RX_COAL_TARGET
;
369 priv
->rx_usecs
= MLX4_EN_RX_COAL_TIME
;
370 en_dbg(INTR
, priv
, "Default coalesing params for mtu:%d - "
371 "rx_frames:%d rx_usecs:%d\n",
372 priv
->dev
->mtu
, priv
->rx_frames
, priv
->rx_usecs
);
374 /* Setup cq moderation params */
375 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
376 cq
= &priv
->rx_cq
[i
];
377 cq
->moder_cnt
= priv
->rx_frames
;
378 cq
->moder_time
= priv
->rx_usecs
;
381 for (i
= 0; i
< priv
->tx_ring_num
; i
++) {
382 cq
= &priv
->tx_cq
[i
];
383 cq
->moder_cnt
= MLX4_EN_TX_COAL_PKTS
;
384 cq
->moder_time
= MLX4_EN_TX_COAL_TIME
;
387 /* Reset auto-moderation params */
388 priv
->pkt_rate_low
= MLX4_EN_RX_RATE_LOW
;
389 priv
->rx_usecs_low
= MLX4_EN_RX_COAL_TIME_LOW
;
390 priv
->pkt_rate_high
= MLX4_EN_RX_RATE_HIGH
;
391 priv
->rx_usecs_high
= MLX4_EN_RX_COAL_TIME_HIGH
;
392 priv
->sample_interval
= MLX4_EN_SAMPLE_INTERVAL
;
393 priv
->adaptive_rx_coal
= 1;
394 priv
->last_moder_time
= MLX4_EN_AUTO_CONF
;
395 priv
->last_moder_jiffies
= 0;
396 priv
->last_moder_packets
= 0;
397 priv
->last_moder_tx_packets
= 0;
398 priv
->last_moder_bytes
= 0;
401 static void mlx4_en_auto_moderation(struct mlx4_en_priv
*priv
)
403 unsigned long period
= (unsigned long) (jiffies
- priv
->last_moder_jiffies
);
404 struct mlx4_en_cq
*cq
;
405 unsigned long packets
;
407 unsigned long avg_pkt_size
;
408 unsigned long rx_packets
;
409 unsigned long rx_bytes
;
410 unsigned long rx_byte_diff
;
411 unsigned long tx_packets
;
412 unsigned long tx_pkt_diff
;
413 unsigned long rx_pkt_diff
;
417 if (!priv
->adaptive_rx_coal
|| period
< priv
->sample_interval
* HZ
)
420 spin_lock_bh(&priv
->stats_lock
);
421 rx_packets
= priv
->stats
.rx_packets
;
422 rx_bytes
= priv
->stats
.rx_bytes
;
423 tx_packets
= priv
->stats
.tx_packets
;
424 spin_unlock_bh(&priv
->stats_lock
);
426 if (!priv
->last_moder_jiffies
|| !period
)
429 tx_pkt_diff
= ((unsigned long) (tx_packets
-
430 priv
->last_moder_tx_packets
));
431 rx_pkt_diff
= ((unsigned long) (rx_packets
-
432 priv
->last_moder_packets
));
433 packets
= max(tx_pkt_diff
, rx_pkt_diff
);
434 rx_byte_diff
= rx_bytes
- priv
->last_moder_bytes
;
435 rx_byte_diff
= rx_byte_diff
? rx_byte_diff
: 1;
436 rate
= packets
* HZ
/ period
;
437 avg_pkt_size
= packets
? ((unsigned long) (rx_bytes
-
438 priv
->last_moder_bytes
)) / packets
: 0;
440 /* Apply auto-moderation only when packet rate exceeds a rate that
442 if (rate
> MLX4_EN_RX_RATE_THRESH
) {
443 /* If tx and rx packet rates are not balanced, assume that
444 * traffic is mainly BW bound and apply maximum moderation.
445 * Otherwise, moderate according to packet rate */
446 if (2 * tx_pkt_diff
> 3 * rx_pkt_diff
&&
447 rx_pkt_diff
/ rx_byte_diff
<
448 MLX4_EN_SMALL_PKT_SIZE
)
449 moder_time
= priv
->rx_usecs_low
;
450 else if (2 * rx_pkt_diff
> 3 * tx_pkt_diff
)
451 moder_time
= priv
->rx_usecs_high
;
453 if (rate
< priv
->pkt_rate_low
)
454 moder_time
= priv
->rx_usecs_low
;
455 else if (rate
> priv
->pkt_rate_high
)
456 moder_time
= priv
->rx_usecs_high
;
458 moder_time
= (rate
- priv
->pkt_rate_low
) *
459 (priv
->rx_usecs_high
- priv
->rx_usecs_low
) /
460 (priv
->pkt_rate_high
- priv
->pkt_rate_low
) +
464 /* When packet rate is low, use default moderation rather than
465 * 0 to prevent interrupt storms if traffic suddenly increases */
466 moder_time
= priv
->rx_usecs
;
469 en_dbg(INTR
, priv
, "tx rate:%lu rx_rate:%lu\n",
470 tx_pkt_diff
* HZ
/ period
, rx_pkt_diff
* HZ
/ period
);
472 en_dbg(INTR
, priv
, "Rx moder_time changed from:%d to %d period:%lu "
473 "[jiff] packets:%lu avg_pkt_size:%lu rate:%lu [p/s])\n",
474 priv
->last_moder_time
, moder_time
, period
, packets
,
477 if (moder_time
!= priv
->last_moder_time
) {
478 priv
->last_moder_time
= moder_time
;
479 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
480 cq
= &priv
->rx_cq
[i
];
481 cq
->moder_time
= moder_time
;
482 err
= mlx4_en_set_cq_moder(priv
, cq
);
484 en_err(priv
, "Failed modifying moderation for cq:%d\n", i
);
491 priv
->last_moder_packets
= rx_packets
;
492 priv
->last_moder_tx_packets
= tx_packets
;
493 priv
->last_moder_bytes
= rx_bytes
;
494 priv
->last_moder_jiffies
= jiffies
;
/*
 * mlx4_en_do_get_stats - periodic statistics work (registered for
 * priv->stats_task via INIT_DELAYED_WORK in mlx4_en_init_netdev).
 *
 * Issues mlx4_en_DUMP_ETH_STATS() with a last argument of 0 (the open
 * path passes 1 to reset the counters).  Then, under mdev->state_lock and
 * while the device is up, runs mlx4_en_auto_moderation() and re-arms
 * itself after STATS_DELAY.  If the mac_removed[] flag tested below is
 * set, it queues priv->mac_task and clears the flag.
 *
 * NOTE(review): the flag index here is MLX4_MAX_PORTS + 1 - priv->port,
 * whereas mlx4_en_start_port()/mlx4_en_stop_port() write
 * mac_removed[priv->port] - confirm the index is intended.
 * NOTE(review): braces, the `err` declaration/check and any port_up test
 * are missing from this listing.
 */
497 static void mlx4_en_do_get_stats(struct work_struct
*work
)
499 struct delayed_work
*delay
= to_delayed_work(work
);
500 struct mlx4_en_priv
*priv
= container_of(delay
, struct mlx4_en_priv
,
502 struct mlx4_en_dev
*mdev
= priv
->mdev
;
505 err
= mlx4_en_DUMP_ETH_STATS(mdev
, priv
->port
, 0);
507 en_dbg(HW
, priv
, "Could not update stats\n");
509 mutex_lock(&mdev
->state_lock
);
510 if (mdev
->device_up
) {
512 mlx4_en_auto_moderation(priv
);
514 queue_delayed_work(mdev
->workqueue
, &priv
->stats_task
, STATS_DELAY
);
516 if (mdev
->mac_removed
[MLX4_MAX_PORTS
+ 1 - priv
->port
]) {
517 queue_work(mdev
->workqueue
, &priv
->mac_task
);
518 mdev
->mac_removed
[MLX4_MAX_PORTS
+ 1 - priv
->port
] = 0;
520 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_linkstate - work handler that propagates a link-state change to
 * the stack (registered for priv->linkstate_task via INIT_WORK in
 * mlx4_en_init_netdev).
 *
 * Samples priv->link_state before taking mdev->state_lock.  If it differs
 * from priv->last_link_state, logs "Link Down"/"Link Up" and calls
 * netif_carrier_off()/netif_carrier_on() accordingly.  The sampled value
 * is then stored in priv->last_link_state.
 *
 * NOTE(review): braces and the `else` are missing from this listing.
 */
523 static void mlx4_en_linkstate(struct work_struct
*work
)
525 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
527 struct mlx4_en_dev
*mdev
= priv
->mdev
;
528 int linkstate
= priv
->link_state
;
530 mutex_lock(&mdev
->state_lock
);
531 /* If observable port state changed set carrier state and
532 * report to system log */
533 if (priv
->last_link_state
!= linkstate
) {
534 if (linkstate
== MLX4_DEV_EVENT_PORT_DOWN
) {
535 en_info(priv
, "Link Down\n");
536 netif_carrier_off(priv
->dev
);
538 en_info(priv
, "Link Up\n");
539 netif_carrier_on(priv
->dev
);
542 priv
->last_link_state
= linkstate
;
543 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_start_port - bring the port's data path up.
 *
 * Callers in this file (open, restart, change_mtu) hold mdev->state_lock.
 * Visible sequence:
 *  1. clamp dev->mtu to priv->max_mtu and compute the RX buffer size;
 *  2. activate the RX rings, then for each RX CQ: activate it, set the
 *     owner bit on every CQE, apply moderation, arm it, and record its
 *     CQ number in the matching RX ring;
 *  3. configure RSS steering;
 *  4. for each TX CQ: activate it, apply moderation, set the wqe_index of
 *     cq->buf to 0xffff, activate the TX ring on that CQ and stamp every
 *     STAMP_STRIDE-th word of the ring buffer with 0xffffffff;
 *  5. mlx4_SET_PORT_general(), mlx4_SET_PORT_qpn_calc(),
 *     mlx4_register_mac(), clear mac_removed[port], mlx4_INIT_PORT();
 *  6. queue the multicast task, set priv->port_up and start all TX
 *     queues.
 *
 * The tail of the function is the error unwind: unregister the MAC,
 * deactivate the TX rings/CQs, release RSS steering, deactivate the RX
 * CQs and rings, and return err.
 *
 * NOTE(review): this listing has lost many lines (braces, `err` checks,
 * gotos, labels, index bookkeeping, the success return, some call
 * arguments) - confirm control flow against the pristine file.
 */
547 int mlx4_en_start_port(struct net_device
*dev
)
549 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
550 struct mlx4_en_dev
*mdev
= priv
->mdev
;
551 struct mlx4_en_cq
*cq
;
552 struct mlx4_en_tx_ring
*tx_ring
;
560 en_dbg(DRV
, priv
, "start port called while port already up\n");
564 /* Calculate Rx buf size */
565 dev
->mtu
= min(dev
->mtu
, priv
->max_mtu
);
566 mlx4_en_calc_rx_buf(dev
);
567 en_dbg(DRV
, priv
, "Rx buf size:%d\n", priv
->rx_skb_size
);
569 /* Configure rx cq's and rings */
570 err
= mlx4_en_activate_rx_rings(priv
);
572 en_err(priv
, "Failed to activate RX rings\n");
575 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
576 cq
= &priv
->rx_cq
[i
];
578 err
= mlx4_en_activate_cq(priv
, cq
);
580 en_err(priv
, "Failed activating Rx CQ\n");
583 for (j
= 0; j
< cq
->size
; j
++)
584 cq
->buf
[j
].owner_sr_opcode
= MLX4_CQE_OWNER_MASK
;
585 err
= mlx4_en_set_cq_moder(priv
, cq
);
587 en_err(priv
, "Failed setting cq moderation parameters");
588 mlx4_en_deactivate_cq(priv
, cq
);
591 mlx4_en_arm_cq(priv
, cq
);
592 priv
->rx_ring
[i
].cqn
= cq
->mcq
.cqn
;
596 err
= mlx4_en_config_rss_steer(priv
);
598 en_err(priv
, "Failed configuring rss steering\n");
602 /* Configure tx cq's and rings */
603 for (i
= 0; i
< priv
->tx_ring_num
; i
++) {
605 cq
= &priv
->tx_cq
[i
];
606 err
= mlx4_en_activate_cq(priv
, cq
);
608 en_err(priv
, "Failed allocating Tx CQ\n");
611 err
= mlx4_en_set_cq_moder(priv
, cq
);
613 en_err(priv
, "Failed setting cq moderation parameters");
614 mlx4_en_deactivate_cq(priv
, cq
);
617 en_dbg(DRV
, priv
, "Resetting index of collapsed CQ:%d to -1\n", i
);
618 cq
->buf
->wqe_index
= cpu_to_be16(0xffff);
621 tx_ring
= &priv
->tx_ring
[i
];
622 err
= mlx4_en_activate_tx_ring(priv
, tx_ring
, cq
->mcq
.cqn
);
624 en_err(priv
, "Failed allocating Tx ring\n");
625 mlx4_en_deactivate_cq(priv
, cq
);
628 /* Set initial ownership of all Tx TXBBs to SW (1) */
629 for (j
= 0; j
< tx_ring
->buf_size
; j
+= STAMP_STRIDE
)
630 *((u32
*) (tx_ring
->buf
+ j
)) = 0xffffffff;
635 err
= mlx4_SET_PORT_general(mdev
->dev
, priv
->port
,
636 priv
->rx_skb_size
+ ETH_FCS_LEN
,
637 priv
->prof
->tx_pause
,
639 priv
->prof
->rx_pause
,
642 en_err(priv
, "Failed setting port general configurations "
643 "for port %d, with error %d\n", priv
->port
, err
);
646 /* Set default qp number */
647 err
= mlx4_SET_PORT_qpn_calc(mdev
->dev
, priv
->port
, priv
->base_qpn
, 0);
649 en_err(priv
, "Failed setting default qp numbers\n");
652 /* Set port mac number */
653 en_dbg(DRV
, priv
, "Setting mac for port %d\n", priv
->port
);
654 err
= mlx4_register_mac(mdev
->dev
, priv
->port
,
655 priv
->mac
, &priv
->mac_index
);
657 en_err(priv
, "Failed setting port mac\n");
660 mdev
->mac_removed
[priv
->port
] = 0;
663 en_dbg(HW
, priv
, "Initializing port\n");
664 err
= mlx4_INIT_PORT(mdev
->dev
, priv
->port
);
666 en_err(priv
, "Failed Initializing port\n");
670 /* Schedule multicast task to populate multicast list */
671 queue_work(mdev
->workqueue
, &priv
->mcast_task
);
673 priv
->port_up
= true;
674 netif_tx_start_all_queues(dev
);
678 mlx4_unregister_mac(mdev
->dev
, priv
->port
, priv
->mac_index
);
681 mlx4_en_deactivate_tx_ring(priv
, &priv
->tx_ring
[tx_index
]);
682 mlx4_en_deactivate_cq(priv
, &priv
->tx_cq
[tx_index
]);
685 mlx4_en_release_rss_steer(priv
);
688 mlx4_en_deactivate_cq(priv
, &priv
->rx_cq
[rx_index
]);
689 for (i
= 0; i
< priv
->rx_ring_num
; i
++)
690 mlx4_en_deactivate_rx_ring(priv
, &priv
->rx_ring
[i
]);
692 return err
; /* need to close devices */
/*
 * mlx4_en_stop_port - tear the port's data path down (inverse of
 * mlx4_en_start_port).
 *
 * Callers in this file (close, restart, change_mtu) hold mdev->state_lock.
 * A port that is already down is only logged.  Otherwise, in order:
 *  - stop all TX queues under netif_tx_lock_bh() so the transmit path has
 *    finished before teardown starts;
 *  - clear priv->port_up;
 *  - unregister the port MAC and set mac_removed[port];
 *  - deactivate every TX ring and TX CQ, then free the TX buffers;
 *  - release RSS steering;
 *  - for every RX ring: deactivate it, wait while NAPI_STATE_SCHED is set
 *    on its CQ's NAPI context, then deactivate the CQ;
 *  - close the port with mlx4_CLOSE_PORT().
 *
 * NOTE(review): braces, the early return, the `i` declaration and the
 * body of the NAPI wait loop are missing from this listing.
 */
696 void mlx4_en_stop_port(struct net_device
*dev
)
698 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
699 struct mlx4_en_dev
*mdev
= priv
->mdev
;
702 if (!priv
->port_up
) {
703 en_dbg(DRV
, priv
, "stop port called while port already down\n");
707 /* Synchronize with tx routine */
708 netif_tx_lock_bh(dev
);
709 netif_tx_stop_all_queues(dev
);
710 netif_tx_unlock_bh(dev
);
712 /* Set port as not active */
713 priv
->port_up
= false;
715 /* Unregister Mac address for the port */
716 mlx4_unregister_mac(mdev
->dev
, priv
->port
, priv
->mac_index
);
717 mdev
->mac_removed
[priv
->port
] = 1;
720 for (i
= 0; i
< priv
->tx_ring_num
; i
++) {
721 mlx4_en_deactivate_tx_ring(priv
, &priv
->tx_ring
[i
]);
722 mlx4_en_deactivate_cq(priv
, &priv
->tx_cq
[i
]);
726 for (i
= 0; i
< priv
->tx_ring_num
; i
++)
727 mlx4_en_free_tx_buf(dev
, &priv
->tx_ring
[i
]);
730 mlx4_en_release_rss_steer(priv
);
733 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
734 mlx4_en_deactivate_rx_ring(priv
, &priv
->rx_ring
[i
]);
735 while (test_bit(NAPI_STATE_SCHED
, &priv
->rx_cq
[i
].napi
.state
))
737 mlx4_en_deactivate_cq(priv
, &priv
->rx_cq
[i
]);
741 mlx4_CLOSE_PORT(mdev
->dev
, priv
->port
);
/*
 * mlx4_en_restart - watchdog work handler (registered for
 * priv->watchdog_task via INIT_WORK in mlx4_en_init_netdev; queued from
 * the TX-timeout hook and from a failed MTU change).
 *
 * Under mdev->state_lock, stops the port and starts it again, logging an
 * error if the restart fails.
 *
 * NOTE(review): lines are missing around the stop/start pair - there may
 * be a guard (e.g. on port state) that is not visible here.
 */
744 static void mlx4_en_restart(struct work_struct
*work
)
746 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
748 struct mlx4_en_dev
*mdev
= priv
->mdev
;
749 struct net_device
*dev
= priv
->dev
;
751 en_dbg(DRV
, priv
, "Watchdog task called for port %d\n", priv
->port
);
753 mutex_lock(&mdev
->state_lock
);
755 mlx4_en_stop_port(dev
);
756 if (mlx4_en_start_port(dev
))
757 en_err(priv
, "Failed restarting port %d\n", priv
->port
);
759 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_open - interface-up hook (installed as .ndo_open in
 * mlx4_netdev_ops).
 *
 * Under mdev->state_lock: refuses to open when the device is down;
 * otherwise asks the hardware to dump/reset its counters
 * (mlx4_en_DUMP_ETH_STATS with a last argument of 1), zeroes priv->stats,
 * priv->pstats and the per-ring byte/packet counters, loads the default
 * moderation settings and starts the port.
 *
 * NOTE(review): the error code assignment for the device-down case, the
 * gotos/label, the `err` check and the final return are missing from this
 * listing.
 */
763 static int mlx4_en_open(struct net_device
*dev
)
765 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
766 struct mlx4_en_dev
*mdev
= priv
->mdev
;
770 mutex_lock(&mdev
->state_lock
);
772 if (!mdev
->device_up
) {
773 en_err(priv
, "Cannot open - device down/disabled\n");
778 /* Reset HW statistics and performance counters */
779 if (mlx4_en_DUMP_ETH_STATS(mdev
, priv
->port
, 1))
780 en_dbg(HW
, priv
, "Failed dumping statistics\n");
782 memset(&priv
->stats
, 0, sizeof(priv
->stats
));
783 memset(&priv
->pstats
, 0, sizeof(priv
->pstats
));
785 for (i
= 0; i
< priv
->tx_ring_num
; i
++) {
786 priv
->tx_ring
[i
].bytes
= 0;
787 priv
->tx_ring
[i
].packets
= 0;
789 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
790 priv
->rx_ring
[i
].bytes
= 0;
791 priv
->rx_ring
[i
].packets
= 0;
794 mlx4_en_set_default_moderation(priv
);
795 err
= mlx4_en_start_port(dev
);
797 en_err(priv
, "Failed starting port:%d\n", priv
->port
);
800 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_close - interface-down hook (installed as .ndo_stop in
 * mlx4_netdev_ops).
 *
 * Under mdev->state_lock, stops the port and marks the carrier off.
 *
 * NOTE(review): the return statement is missing from this listing.
 */
805 static int mlx4_en_close(struct net_device
*dev
)
807 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
808 struct mlx4_en_dev
*mdev
= priv
->mdev
;
810 en_dbg(IFDOWN
, priv
, "Close port called\n");
812 mutex_lock(&mdev
->state_lock
);
814 mlx4_en_stop_port(dev
);
815 netif_carrier_off(dev
);
817 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_en_free_resources - destroy the rings and CQs created by
 * mlx4_en_alloc_resources().
 *
 * Each object is destroyed only if its backing pointer is set
 * (tx_info / rx_info for rings, buf for CQs), so the function can be
 * called after a partially failed allocation.
 */
821 void mlx4_en_free_resources(struct mlx4_en_priv
*priv
)
825 for (i
= 0; i
< priv
->tx_ring_num
; i
++) {
826 if (priv
->tx_ring
[i
].tx_info
)
827 mlx4_en_destroy_tx_ring(priv
, &priv
->tx_ring
[i
]);
828 if (priv
->tx_cq
[i
].buf
)
829 mlx4_en_destroy_cq(priv
, &priv
->tx_cq
[i
]);
832 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
833 if (priv
->rx_ring
[i
].rx_info
)
834 mlx4_en_destroy_rx_ring(priv
, &priv
->rx_ring
[i
]);
835 if (priv
->rx_cq
[i
].buf
)
836 mlx4_en_destroy_cq(priv
, &priv
->rx_cq
[i
]);
/*
 * mlx4_en_alloc_resources - create every TX and RX completion queue and
 * ring for @priv.
 *
 * For each TX index: create a CQ sized prof->tx_ring_size, then a TX ring
 * of the same size with TXBB_SIZE stride.  For each RX index: create a CQ
 * sized prof->rx_ring_size, then an RX ring with priv->stride.  The
 * en_err() at the end belongs to the shared failure path.
 *
 * NOTE(review): the gotos, the error label, and both return statements
 * are missing from this listing; no cleanup call is visible on the
 * failure path, so presumably the caller releases partial allocations -
 * confirm.
 */
840 int mlx4_en_alloc_resources(struct mlx4_en_priv
*priv
)
842 struct mlx4_en_port_profile
*prof
= priv
->prof
;
845 /* Create tx Rings */
846 for (i
= 0; i
< priv
->tx_ring_num
; i
++) {
847 if (mlx4_en_create_cq(priv
, &priv
->tx_cq
[i
],
848 prof
->tx_ring_size
, i
, TX
))
851 if (mlx4_en_create_tx_ring(priv
, &priv
->tx_ring
[i
],
852 prof
->tx_ring_size
, TXBB_SIZE
))
856 /* Create rx Rings */
857 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
858 if (mlx4_en_create_cq(priv
, &priv
->rx_cq
[i
],
859 prof
->rx_ring_size
, i
, RX
))
862 if (mlx4_en_create_rx_ring(priv
, &priv
->rx_ring
[i
],
863 prof
->rx_ring_size
, priv
->stride
))
870 en_err(priv
, "Failed to allocate NIC resources\n");
/*
 * mlx4_en_destroy_netdev - undo mlx4_en_init_netdev().
 *
 * Visible order: unregister the netdev if it was registered, free the
 * hardware queue resource held in priv->res, cancel the delayed stats
 * work and flush the driver workqueue, clear this port's slot in
 * mdev->pndev[] under mdev->state_lock, then free rings and CQs.
 *
 * NOTE(review): lines are missing from this listing - the hwq free may be
 * conditional (priv->allocated is set elsewhere in this file), and the
 * final release of the net_device is not visible.
 */
875 void mlx4_en_destroy_netdev(struct net_device
*dev
)
877 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
878 struct mlx4_en_dev
*mdev
= priv
->mdev
;
880 en_dbg(DRV
, priv
, "Destroying netdev on port:%d\n", priv
->port
);
882 /* Unregister device - this will close the port if it was up */
883 if (priv
->registered
)
884 unregister_netdev(dev
);
887 mlx4_free_hwq_res(mdev
->dev
, &priv
->res
, MLX4_EN_PAGE_SIZE
);
889 cancel_delayed_work(&priv
->stats_task
);
890 /* flush any pending task for this netdev */
891 flush_workqueue(mdev
->workqueue
);
893 /* Detach the netdev so tasks would not attempt to access it */
894 mutex_lock(&mdev
->state_lock
);
895 mdev
->pndev
[priv
->port
] = NULL
;
896 mutex_unlock(&mdev
->state_lock
);
898 mlx4_en_free_resources(priv
);
/*
 * mlx4_en_change_mtu - MTU change hook (installed as .ndo_change_mtu in
 * mlx4_netdev_ops).
 *
 * Rejects values outside [MLX4_EN_MIN_MTU, priv->max_mtu].  When the
 * interface is running it takes mdev->state_lock; if the device is down
 * it only logs, otherwise it stops the port, reloads the default
 * moderation settings and starts the port again.  A failed restart is
 * logged and handed to the watchdog task for another attempt.
 *
 * NOTE(review): the store of the new MTU into dev->mtu, the error return
 * for a bad MTU, the `else`/`err` checks and the final return are missing
 * from this listing.
 */
902 static int mlx4_en_change_mtu(struct net_device
*dev
, int new_mtu
)
904 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
905 struct mlx4_en_dev
*mdev
= priv
->mdev
;
908 en_dbg(DRV
, priv
, "Change MTU called - current:%d new:%d\n",
911 if ((new_mtu
< MLX4_EN_MIN_MTU
) || (new_mtu
> priv
->max_mtu
)) {
912 en_err(priv
, "Bad MTU size:%d.\n", new_mtu
);
917 if (netif_running(dev
)) {
918 mutex_lock(&mdev
->state_lock
);
919 if (!mdev
->device_up
) {
920 /* NIC is probably restarting - let watchdog task reset
922 en_dbg(DRV
, priv
, "Change MTU called with card down!?\n");
924 mlx4_en_stop_port(dev
);
925 mlx4_en_set_default_moderation(priv
);
926 err
= mlx4_en_start_port(dev
);
928 en_err(priv
, "Failed restarting port:%d\n",
930 queue_work(mdev
->workqueue
, &priv
->watchdog_task
);
933 mutex_unlock(&mdev
->state_lock
);
/*
 * mlx4_netdev_ops - net_device entry points for an mlx4_en port; attached
 * to the netdev through dev->netdev_ops in mlx4_en_init_netdev().
 *
 * mlx4_en_xmit and mlx4_en_select_queue are not defined in this part of
 * the file.  The poll-controller entry exists only when
 * CONFIG_NET_POLL_CONTROLLER is defined.
 *
 * NOTE(review): the closing #endif and the terminating "};" are missing
 * from this listing.
 */
938 static const struct net_device_ops mlx4_netdev_ops
= {
939 .ndo_open
= mlx4_en_open
,
940 .ndo_stop
= mlx4_en_close
,
941 .ndo_start_xmit
= mlx4_en_xmit
,
942 .ndo_select_queue
= mlx4_en_select_queue
,
943 .ndo_get_stats
= mlx4_en_get_stats
,
944 .ndo_set_multicast_list
= mlx4_en_set_multicast
,
945 .ndo_set_mac_address
= mlx4_en_set_mac
,
946 .ndo_validate_addr
= eth_validate_addr
,
947 .ndo_change_mtu
= mlx4_en_change_mtu
,
948 .ndo_tx_timeout
= mlx4_en_tx_timeout
,
949 .ndo_vlan_rx_register
= mlx4_en_vlan_rx_register
,
950 .ndo_vlan_rx_add_vid
= mlx4_en_vlan_rx_add_vid
,
951 .ndo_vlan_rx_kill_vid
= mlx4_en_vlan_rx_kill_vid
,
952 #ifdef CONFIG_NET_POLL_CONTROLLER
953 .ndo_poll_controller
= mlx4_en_netpoll
,
957 int mlx4_en_init_netdev(struct mlx4_en_dev
*mdev
, int port
,
958 struct mlx4_en_port_profile
*prof
)
960 struct net_device
*dev
;
961 struct mlx4_en_priv
*priv
;
965 dev
= alloc_etherdev_mq(sizeof(struct mlx4_en_priv
), prof
->tx_ring_num
);
967 mlx4_err(mdev
, "Net device allocation failed\n");
971 SET_NETDEV_DEV(dev
, &mdev
->dev
->pdev
->dev
);
972 dev
->dev_id
= port
- 1;
975 * Initialize driver private data
978 priv
= netdev_priv(dev
);
979 memset(priv
, 0, sizeof(struct mlx4_en_priv
));
984 priv
->port_up
= false;
986 priv
->flags
= prof
->flags
;
987 priv
->tx_ring_num
= prof
->tx_ring_num
;
988 priv
->rx_ring_num
= prof
->rx_ring_num
;
989 priv
->mac_index
= -1;
990 priv
->msg_enable
= MLX4_EN_MSG_LEVEL
;
991 spin_lock_init(&priv
->stats_lock
);
992 INIT_WORK(&priv
->mcast_task
, mlx4_en_do_set_multicast
);
993 INIT_WORK(&priv
->mac_task
, mlx4_en_do_set_mac
);
994 INIT_WORK(&priv
->watchdog_task
, mlx4_en_restart
);
995 INIT_WORK(&priv
->linkstate_task
, mlx4_en_linkstate
);
996 INIT_DELAYED_WORK(&priv
->stats_task
, mlx4_en_do_get_stats
);
998 /* Query for default mac and max mtu */
999 priv
->max_mtu
= mdev
->dev
->caps
.eth_mtu_cap
[priv
->port
];
1000 priv
->mac
= mdev
->dev
->caps
.def_mac
[priv
->port
];
1001 if (ILLEGAL_MAC(priv
->mac
)) {
1002 en_err(priv
, "Port: %d, invalid mac burned: 0x%llx, quiting\n",
1003 priv
->port
, priv
->mac
);
1008 priv
->stride
= roundup_pow_of_two(sizeof(struct mlx4_en_rx_desc
) +
1009 DS_SIZE
* MLX4_EN_MAX_RX_FRAGS
);
1010 err
= mlx4_en_alloc_resources(priv
);
1014 /* Allocate page for receive rings */
1015 err
= mlx4_alloc_hwq_res(mdev
->dev
, &priv
->res
,
1016 MLX4_EN_PAGE_SIZE
, MLX4_EN_PAGE_SIZE
);
1018 en_err(priv
, "Failed to allocate page for rx qps\n");
1021 priv
->allocated
= 1;
1024 * Initialize netdev entry points
1026 dev
->netdev_ops
= &mlx4_netdev_ops
;
1027 dev
->watchdog_timeo
= MLX4_EN_WATCHDOG_TIMEOUT
;
1028 netif_set_real_num_tx_queues(dev
, priv
->tx_ring_num
);
1029 netif_set_real_num_rx_queues(dev
, priv
->rx_ring_num
);
1031 SET_ETHTOOL_OPS(dev
, &mlx4_en_ethtool_ops
);
1033 /* Set defualt MAC */
1034 dev
->addr_len
= ETH_ALEN
;
1035 for (i
= 0; i
< ETH_ALEN
; i
++) {
1036 dev
->dev_addr
[ETH_ALEN
- 1 - i
] = (u8
) (priv
->mac
>> (8 * i
));
1037 dev
->perm_addr
[ETH_ALEN
- 1 - i
] = (u8
) (priv
->mac
>> (8 * i
));
1041 * Set driver features
1043 dev
->features
|= NETIF_F_SG
;
1044 dev
->vlan_features
|= NETIF_F_SG
;
1045 dev
->features
|= NETIF_F_IP_CSUM
| NETIF_F_IPV6_CSUM
;
1046 dev
->vlan_features
|= NETIF_F_IP_CSUM
| NETIF_F_IPV6_CSUM
;
1047 dev
->features
|= NETIF_F_HIGHDMA
;
1048 dev
->features
|= NETIF_F_HW_VLAN_TX
|
1049 NETIF_F_HW_VLAN_RX
|
1050 NETIF_F_HW_VLAN_FILTER
;
1051 dev
->features
|= NETIF_F_GRO
;
1052 if (mdev
->LSO_support
) {
1053 dev
->features
|= NETIF_F_TSO
;
1054 dev
->features
|= NETIF_F_TSO6
;
1055 dev
->vlan_features
|= NETIF_F_TSO
;
1056 dev
->vlan_features
|= NETIF_F_TSO6
;
1059 mdev
->pndev
[port
] = dev
;
1061 netif_carrier_off(dev
);
1062 err
= register_netdev(dev
);
1064 en_err(priv
, "Netdev registration failed for port %d\n", port
);
1068 en_warn(priv
, "Using %d TX rings\n", prof
->tx_ring_num
);
1069 en_warn(priv
, "Using %d RX rings\n", prof
->rx_ring_num
);
1071 priv
->registered
= 1;
1072 queue_delayed_work(mdev
->workqueue
, &priv
->stats_task
, STATS_DELAY
);
1076 mlx4_en_destroy_netdev(dev
);