staging: unisys: Add s-Par visornic ethernet driver
authorDavid Kershner <david.kershner@unisys.com>
Tue, 16 Jun 2015 03:31:59 +0000 (23:31 -0400)
committerGreg Kroah-Hartman <gregkh@linuxfoundation.org>
Tue, 16 Jun 2015 21:34:55 +0000 (14:34 -0700)
This driver creates a network device when s-Par sends a device
create message to create network adapter on the visorbus. When
the message is received by visorbus, the visornic_probe function
is called and the netdev device is created and managed by the
visornic driver.

Signed-off-by: David Kershner <david.kershner@unisys.com>
Signed-off-by: Benjamin Romer <benjamin.romer@unisys.com>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
drivers/staging/unisys/Kconfig
drivers/staging/unisys/Makefile
drivers/staging/unisys/visornic/Kconfig [new file with mode: 0644]
drivers/staging/unisys/visornic/Makefile [new file with mode: 0644]
drivers/staging/unisys/visornic/visornic_main.c [new file with mode: 0644]

index 0c3e9a1368a87294e1d7ddce4d30723f8d389bf4..778f9d05f98a83646604cc98f618af37591af4d5 100644 (file)
@@ -12,5 +12,6 @@ menuconfig UNISYSSPAR
 if UNISYSSPAR
 
 source "drivers/staging/unisys/visorbus/Kconfig"
+source "drivers/staging/unisys/visornic/Kconfig"
 
 endif # UNISYSSPAR
index 566af8e39aea53ae01411f28779384315c8e3f87..a515ebc4f8ecfaa36e4dd622b5791bdb4d4c1eab 100644 (file)
@@ -2,3 +2,4 @@
 # Makefile for Unisys SPAR drivers
 #
 obj-$(CONFIG_UNISYS_VISORBUS)          += visorbus/
+obj-$(CONFIG_UNISYS_VISORNIC)          += visornic/
diff --git a/drivers/staging/unisys/visornic/Kconfig b/drivers/staging/unisys/visornic/Kconfig
new file mode 100644 (file)
index 0000000..1676dc7
--- /dev/null
@@ -0,0 +1,15 @@
+#
+# Unisys visornic configuration
+#
+
+config UNISYS_VISORNIC
+       tristate "Unisys visornic driver"
+       depends on UNISYSSPAR && UNISYS_VISORBUS && NET
+       ---help---
+       The Unisys Visornic driver provides support for s-Par network
+       devices exposed on the s-Par visorbus. When a message is sent
+       to visorbus to create a network device, the probe function of
+       visornic is called to create the netdev device. Networking on
+       s-Par switches will not work if this driver is not selected.
+       If you say Y here, you will enable the Unisys visornic driver.
+
diff --git a/drivers/staging/unisys/visornic/Makefile b/drivers/staging/unisys/visornic/Makefile
new file mode 100644 (file)
index 0000000..439e95e
--- /dev/null
@@ -0,0 +1,10 @@
+#
+# Makefile for Unisys channel
+#
+
+obj-$(CONFIG_UNISYS_VISORNIC)  += visornic.o
+
+visornic-y := visornic_main.o
+
+ccflags-y += -Idrivers/staging/unisys/include
+
diff --git a/drivers/staging/unisys/visornic/visornic_main.c b/drivers/staging/unisys/visornic/visornic_main.c
new file mode 100644 (file)
index 0000000..7100744
--- /dev/null
@@ -0,0 +1,2140 @@
+/* Copyright (c) 2012 - 2015 UNISYS CORPORATION
+ * All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or (at
+ * your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE, GOOD TITLE or
+ * NON INFRINGEMENT.  See the GNU General Public License for more
+ * details.
+ */
+
+/* This driver lives in a spar partition, and registers to ethernet io
+ * channels from the visorbus driver. It creates netdev devices and
+ * forwards transmit to the IO channel and accepts rcvs from the IO
+ * Partition via the IO channel.
+ */
+
+#include <linux/debugfs.h>
+#include <linux/netdevice.h>
+#include <linux/etherdevice.h>
+#include <linux/skbuff.h>
+#include <linux/kthread.h>
+
+#include "visorbus.h"
+#include "iochannel.h"
+
+#define VISORNIC_INFINITE_RESPONSE_WAIT 0
+#define VISORNICSOPENMAX 32
+#define MAXDEVICES     16384
+
+/* MAX_BUF = 64 lines x 32 MAXVNIC x 80 characters
+ *         = 163840 bytes
+ */
+#define MAX_BUF 163840
+
+static spinlock_t dev_num_pool_lock;
+static void *dev_num_pool;     /**< pool to grab device numbers from */
+
+static int visornic_probe(struct visor_device *dev);
+static void visornic_remove(struct visor_device *dev);
+static int visornic_pause(struct visor_device *dev,
+                         visorbus_state_complete_func complete_func);
+static int visornic_resume(struct visor_device *dev,
+                          visorbus_state_complete_func complete_func);
+
+/* DEBUGFS declarations */
+static ssize_t info_debugfs_read(struct file *file, char __user *buf,
+                                size_t len, loff_t *offset);
+static ssize_t enable_ints_write(struct file *file, const char __user *buf,
+                                size_t len, loff_t *ppos);
+static struct dentry *visornic_debugfs_dir;
+static const struct file_operations debugfs_info_fops = {
+       .read = info_debugfs_read,
+};
+
+static const struct file_operations debugfs_enable_ints_fops = {
+       .write = enable_ints_write,
+};
+
+static struct workqueue_struct *visornic_serverdown_workqueue;
+static struct workqueue_struct *visornic_timeout_reset_workqueue;
+
+/* GUIDS for director channel type supported by this driver.  */
+static struct visor_channeltype_descriptor visornic_channel_types[] = {
+       /* Note that the only channel type we expect to be reported by the
+        * bus driver is the SPAR_VNIC channel.
+        */
+       { SPAR_VNIC_CHANNEL_PROTOCOL_UUID, "ultravnic" },
+       { NULL_UUID_LE, NULL }
+};
+
+/* This is used to tell the visor bus driver which types of visor devices
+ * we support, and what functions to call when a visor device that we support
+ * is attached or removed.
+ */
+static struct visor_driver visornic_driver = {
+       .name = "visornic",
+       .version = "1.0.0.0",
+       .vertag = NULL,
+       .owner = THIS_MODULE,
+       .channel_types = visornic_channel_types,
+       .probe = visornic_probe,
+       .remove = visornic_remove,
+       .pause = visornic_pause,
+       .resume = visornic_resume,
+       .channel_interrupt = NULL,
+};
+
+struct visor_thread_info {
+       struct task_struct *task;
+       struct completion has_stopped;
+       int id;
+};
+
+struct chanstat {
+       unsigned long got_rcv;
+       unsigned long got_enbdisack;
+       unsigned long got_xmit_done;
+       unsigned long xmit_fail;
+       unsigned long sent_enbdis;
+       unsigned long sent_promisc;
+       unsigned long sent_post;
+       unsigned long sent_xmit;
+       unsigned long reject_count;
+       unsigned long extra_rcvbufs_sent;
+};
+
+struct visornic_devdata {
+       int devnum;
+       int thread_wait_ms;
+       unsigned short enabled;         /* 0 disabled 1 enabled to receive */
+       unsigned short enab_dis_acked;  /* NET_RCV_ENABLE/DISABLE acked by
+                                        * IOPART
+                                        */
+       struct visor_device *dev;
+       char name[99];
+       struct list_head list_all;   /* < link within list_all_devices list */
+       struct kref kref;
+       struct net_device *netdev;
+       struct net_device_stats net_stats;
+       atomic_t interrupt_rcvd;
+       wait_queue_head_t rsp_queue;
+       struct sk_buff **rcvbuf;
+       u64 uniquenum; /* TODO figure out why not used */
+       unsigned short old_flags;       /* flags as they were prior to
+                                        * set_multicast_list
+                                        */
+       atomic_t usage;                 /* count of users */
+       int num_rcv_bufs;               /* indicates how many rcv buffers
+                                        * the vnic will post
+                                        */
+       int num_rcv_bufs_could_not_alloc;
+       atomic_t num_rcvbuf_in_iovm;
+       unsigned long alloc_failed_in_if_needed_cnt;
+       unsigned long alloc_failed_in_repost_rtn_cnt;
+       int max_outstanding_net_xmits;   /* absolute max number of outstanding
+                                         * xmits - should never hit this
+                                         */
+       int upper_threshold_net_xmits;   /* high water mark for calling
+                                         * netif_stop_queue()
+                                         */
+       int lower_threshold_net_xmits;   /* high water mark for calling
+                                         * netif_wake_queue()
+                                         */
+       struct sk_buff_head xmitbufhead; /* xmitbufhead is the head of the
+                                         * xmit buffer list that have been
+                                         * sent to the IOPART end
+                                         */
+       struct work_struct serverdown_completion;
+       struct work_struct timeout_reset;
+       struct uiscmdrsp *cmdrsp_rcv;    /* cmdrsp_rcv is used for
+                                         * posting/unposting rcv buffers
+                                         */
+       struct uiscmdrsp *xmit_cmdrsp;   /* used to issue NET_XMIT - there is
+                                         * never more that one xmit in
+                                         * progress at a time
+                                         */
+       bool server_down;                /* IOPART is down */
+       bool server_change_state;        /* Processing SERVER_CHANGESTATE msg */
+       struct dentry *eth_debugfs_dir;
+       struct visor_thread_info threadinfo;
+       u64 interrupts_rcvd;
+       u64 interrupts_notme;
+       u64 interrupts_disabled;
+       u64 busy_cnt;
+       spinlock_t priv_lock;  /* spinlock to access devdata structures */
+
+       /* flow control counter */
+       u64 flow_control_upper_hits;
+       u64 flow_control_lower_hits;
+
+       /* debug counters */
+       unsigned long n_rcv0;                   /* # rcvs of 0 buffers */
+       unsigned long n_rcv1;                   /* # rcvs of 1 buffers */
+       unsigned long n_rcv2;                   /* # rcvs of 2 buffers */
+       unsigned long n_rcvx;                   /* # rcvs of >2 buffers */
+       unsigned long found_repost_rcvbuf_cnt;  /* # times we called
+                                                *   repost_rcvbuf_cnt
+                                                */
+       unsigned long repost_found_skb_cnt;     /* # times found the skb */
+       unsigned long n_repost_deficit;         /* # times we couldn't find
+                                                *   all of the rcv buffers
+                                                */
+       unsigned long bad_rcv_buf;              /* # times we negleted to
+                                                * free the rcv skb because
+                                                * we didn't know where it
+                                                * came from
+                                                */
+       unsigned long n_rcv_packets_not_accepted;/* # bogs rcv packets */
+
+       int queuefullmsg_logged;
+       struct chanstat chstat;
+};
+
+/* array of open devices maintained by open() and close() */
+static struct net_device *num_visornic_open[VISORNICSOPENMAX];
+
+/* List of all visornic_devdata structs,
+ * linked via the list_all member
+ */
+static LIST_HEAD(list_all_devices);
+static DEFINE_SPINLOCK(lock_all_devices);
+
+/**
+ *     visor_copy_fragsinfo_from_skb(
+ *     @skb_in: skbuff that we are pulling the frags from
+ *     @firstfraglen: length of first fragment in skb
+ *     @frags_max: max len of frags array
+ *     @frags: frags array filled in on output
+ *
+ *     Copy the fragment list in the SKB to a phys_info
+ *     array that the IOPART understands.
+ *     Return value indicates number of entries filled in frags
+ *     Negative values indicate an error.
+ */
+static unsigned int
+visor_copy_fragsinfo_from_skb(struct sk_buff *skb, unsigned int firstfraglen,
+                             unsigned int frags_max,
+                             struct phys_info frags[])
+{
+       unsigned int count = 0, ii, size, offset = 0, numfrags;
+
+       numfrags = skb_shinfo(skb)->nr_frags;
+
+       while (firstfraglen) {
+               if (count == frags_max)
+                       return -EINVAL;
+
+               frags[count].pi_pfn =
+                       page_to_pfn(virt_to_page(skb->data + offset));
+               frags[count].pi_off =
+                       (unsigned long)(skb->data + offset) & PI_PAGE_MASK;
+               size = min_t(unsigned int, firstfraglen,
+                            PI_PAGE_SIZE - frags[count].pi_off);
+
+               /* can take smallest of firstfraglen (what's left) OR
+                * bytes left in the page
+                */
+               frags[count].pi_len = size;
+               firstfraglen -= size;
+               offset += size;
+               count++;
+       }
+       if (numfrags) {
+               if ((count + numfrags) > frags_max)
+                       return -EINVAL;
+
+               for (ii = 0; ii < numfrags; ii++) {
+                       count = add_physinfo_entries(page_to_pfn(
+                               skb_frag_page(&skb_shinfo(skb)->frags[ii])),
+                                             skb_shinfo(skb)->frags[ii].
+                                             page_offset,
+                                             skb_shinfo(skb)->frags[ii].
+                                             size, count, frags_max, frags);
+                       if (!count)
+                               return -EIO;
+               }
+       }
+       if (skb_shinfo(skb)->frag_list) {
+               struct sk_buff *skbinlist;
+               int c;
+
+               for (skbinlist = skb_shinfo(skb)->frag_list; skbinlist;
+                    skbinlist = skbinlist->next) {
+                       c = visor_copy_fragsinfo_from_skb(skbinlist,
+                                                         skbinlist->len -
+                                                         skbinlist->data_len,
+                                                         frags_max - count,
+                                                         &frags[count]);
+                       if (c < 0)
+                               return c;
+                       count += c;
+               }
+       }
+       return count;
+}
+
+/**
+ *     visort_thread_start - starts thread for the device
+ *     @thrinfo: The thread to start
+ *     @threadfn: Function the thread starts
+ *     @thrcontext: Context to pass to the thread, i.e. devdata
+ *     @name:  string describing name of thread
+ *
+ *     Starts a thread for the device, currently only thread is
+ *     process_incoming_rsps
+ *     Returns 0 on success;
+ */
+static int visor_thread_start(struct visor_thread_info *thrinfo,
+                             int (*threadfn)(void *),
+                             void *thrcontext, char *name)
+{
+       /* used to stop the thread */
+       init_completion(&thrinfo->has_stopped);
+       thrinfo->task = kthread_run(threadfn, thrcontext, name);
+       if (IS_ERR(thrinfo->task)) {
+               thrinfo->id = 0;
+               return -EINVAL;
+       }
+       thrinfo->id = thrinfo->task->pid;
+       return 0;
+}
+
+/**
+ *     visor_thread_stop - stop a thread for the device
+ *     @thrinfo: The thread to stop
+ *
+ *     Stop the thread and wait for completion for a minute
+ *     Returns void.
+ */
+static void visor_thread_stop(struct visor_thread_info *thrinfo)
+{
+       if (!thrinfo->id)
+               return; /* thread not running */
+
+       kthread_stop(thrinfo->task);
+       /* give up if the thread has NOT died in 1 minute */
+       if (wait_for_completion_timeout(&thrinfo->has_stopped, 60 * HZ))
+               thrinfo->id = 0;
+}
+
+/* DebugFS code */
+static ssize_t info_debugfs_read(struct file *file, char __user *buf,
+                                size_t len, loff_t *offset)
+{
+       int i;
+       ssize_t bytes_read = 0;
+       int str_pos = 0;
+       struct visornic_devdata *devdata;
+       char *vbuf;
+
+       if (len > MAX_BUF)
+               len = MAX_BUF;
+       vbuf = kzalloc(len, GFP_KERNEL);
+       if (!vbuf)
+               return -ENOMEM;
+
+       /* for each vnic channel
+        * dump out channel specific data
+        */
+       for (i = 0; i < VISORNICSOPENMAX; i++) {
+               if (!num_visornic_open[i])
+                       continue;
+
+               devdata = netdev_priv(num_visornic_open[i]);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    "Vnic i = %d\n", i);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    "netdev = %s (0x%p), MAC Addr %pM\n",
+                                    num_visornic_open[i]->name,
+                                    num_visornic_open[i],
+                                    num_visornic_open[i]->dev_addr);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    "VisorNic Dev Info = 0x%p\n", devdata);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " num_rcv_bufs = %d\n",
+                                    devdata->num_rcv_bufs);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " max_oustanding_next_xmits = %d\n",
+                                   devdata->max_outstanding_net_xmits);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " upper_threshold_net_xmits = %d\n",
+                                    devdata->upper_threshold_net_xmits);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " lower_threshold_net_xmits = %d\n",
+                                    devdata->lower_threshold_net_xmits);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " queuefullmsg_logged = %d\n",
+                                    devdata->queuefullmsg_logged);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.got_rcv = %lu\n",
+                                    devdata->chstat.got_rcv);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.got_enbdisack = %lu\n",
+                                    devdata->chstat.got_enbdisack);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.got_xmit_done = %lu\n",
+                                    devdata->chstat.got_xmit_done);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.xmit_fail = %lu\n",
+                                    devdata->chstat.xmit_fail);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.sent_enbdis = %lu\n",
+                                    devdata->chstat.sent_enbdis);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.sent_promisc = %lu\n",
+                                    devdata->chstat.sent_promisc);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.sent_post = %lu\n",
+                                    devdata->chstat.sent_post);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.sent_xmit = %lu\n",
+                                    devdata->chstat.sent_xmit);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.reject_count = %lu\n",
+                                    devdata->chstat.reject_count);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " chstat.extra_rcvbufs_sent = %lu\n",
+                                    devdata->chstat.extra_rcvbufs_sent);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " n_rcv0 = %lu\n", devdata->n_rcv0);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " n_rcv1 = %lu\n", devdata->n_rcv1);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " n_rcv2 = %lu\n", devdata->n_rcv2);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " n_rcvx = %lu\n", devdata->n_rcvx);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " num_rcvbuf_in_iovm = %d\n",
+                                    atomic_read(&devdata->num_rcvbuf_in_iovm));
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " alloc_failed_in_if_needed_cnt = %lu\n",
+                                    devdata->alloc_failed_in_if_needed_cnt);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " alloc_failed_in_repost_rtn_cnt = %lu\n",
+                                    devdata->alloc_failed_in_repost_rtn_cnt);
+               /* str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                *                   " inner_loop_limit_reached_cnt = %lu\n",
+                *                   devdata->inner_loop_limit_reached_cnt);
+                */
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " found_repost_rcvbuf_cnt = %lu\n",
+                                    devdata->found_repost_rcvbuf_cnt);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " repost_found_skb_cnt = %lu\n",
+                                    devdata->repost_found_skb_cnt);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " n_repost_deficit = %lu\n",
+                                    devdata->n_repost_deficit);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " bad_rcv_buf = %lu\n",
+                                    devdata->bad_rcv_buf);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " n_rcv_packets_not_accepted = %lu\n",
+                                    devdata->n_rcv_packets_not_accepted);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " interrupts_rcvd = %llu\n",
+                                    devdata->interrupts_rcvd);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " interrupts_notme = %llu\n",
+                                    devdata->interrupts_notme);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " interrupts_disabled = %llu\n",
+                                    devdata->interrupts_disabled);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " busy_cnt = %llu\n",
+                                    devdata->busy_cnt);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " flow_control_upper_hits = %llu\n",
+                                    devdata->flow_control_upper_hits);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " flow_control_lower_hits = %llu\n",
+                                    devdata->flow_control_lower_hits);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " thread_wait_ms = %d\n",
+                                    devdata->thread_wait_ms);
+               str_pos += scnprintf(vbuf + str_pos, len - str_pos,
+                                    " netif_queue = %s\n",
+                                    netif_queue_stopped(devdata->netdev) ?
+                                    "stopped" : "running");
+       }
+       bytes_read = simple_read_from_buffer(buf, len, offset, vbuf, str_pos);
+       kfree(vbuf);
+       return bytes_read;
+}
+
+static ssize_t enable_ints_write(struct file *file,
+                                const char __user *buffer,
+                                size_t count, loff_t *ppos)
+{
+       char buf[4];
+       int i, new_value;
+       struct visornic_devdata *devdata;
+
+       if (count >= ARRAY_SIZE(buf))
+               return -EINVAL;
+
+       buf[count] = '\0';
+       if (copy_from_user(buf, buffer, count))
+               return -EFAULT;
+
+       i = kstrtoint(buf, 10, &new_value);
+       if (i != 0)
+               return -EFAULT;
+
+       /* set all counts to new_value usually 0 */
+       for (i = 0; i < VISORNICSOPENMAX; i++) {
+               if (num_visornic_open[i]) {
+                       devdata = netdev_priv(num_visornic_open[i]);
+                       /* TODO update features bit in channel */
+               }
+       }
+
+       return count;
+}
+
+/**
+ *     visornic_serverdown_complete - IOPART went down, need to pause
+ *                                    device
+ *     @work: Work queue it was scheduled on
+ *
+ *     The IO partition has gone down and we need to do some cleanup
+ *     for when it comes back. Treat the IO partition as the link
+ *     being down.
+ *     Returns void.
+ */
+static void
+visornic_serverdown_complete(struct work_struct *work)
+{
+       struct visornic_devdata *devdata;
+       struct net_device *netdev;
+       unsigned long flags;
+       int i = 0, count = 0;
+
+       devdata = container_of(work, struct visornic_devdata,
+                              serverdown_completion);
+       netdev = devdata->netdev;
+
+       /* Stop using datachan */
+       visor_thread_stop(&devdata->threadinfo);
+
+       /* Inform Linux that the link is down */
+       netif_carrier_off(netdev);
+       netif_stop_queue(netdev);
+
+       /* Free the skb for XMITs that haven't been serviced by the server
+        * We shouldn't have to inform Linux about these IOs because they
+        * are "lost in the ethernet"
+        */
+       skb_queue_purge(&devdata->xmitbufhead);
+
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       /* free rcv buffers */
+       for (i = 0; i < devdata->num_rcv_bufs; i++) {
+               if (devdata->rcvbuf[i]) {
+                       kfree_skb(devdata->rcvbuf[i]);
+                       devdata->rcvbuf[i] = NULL;
+                       count++;
+               }
+       }
+       atomic_set(&devdata->num_rcvbuf_in_iovm, 0);
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       devdata->server_down = true;
+       devdata->server_change_state = false;
+}
+
+/**
+ *     visornic_serverdown - Command has notified us that IOPARt is down
+ *     @devdata: device that is being managed by IOPART
+ *
+ *     Schedule the work needed to handle the server down request. Make
+ *     sure we haven't already handled the server change state event.
+ *     Returns 0 if we scheduled the work, -EINVAL on error.
+ */
+static int
+visornic_serverdown(struct visornic_devdata *devdata)
+{
+       if (!devdata->server_down && !devdata->server_change_state) {
+               devdata->server_change_state = true;
+               queue_work(visornic_serverdown_workqueue,
+                          &devdata->serverdown_completion);
+       } else if (devdata->server_change_state) {
+               return -EINVAL;
+       }
+       return 0;
+}
+
+/**
+ *     alloc_rcv_buf   - alloc rcv buffer to be given to the IO Partition.
+ *     @netdev: network adapter the rcv bufs are attached too.
+ *
+ *     Create an sk_buff (rcv_buf) that will be passed to the IO Partition
+ *     so that it can write rcv data into our memory space.
+ *     Return pointer to sk_buff
+ */
+static struct sk_buff *
+alloc_rcv_buf(struct net_device *netdev)
+{
+       struct sk_buff *skb;
+
+       /* NOTE: the first fragment in each rcv buffer is pointed to by
+        * rcvskb->data. For now all rcv buffers will be RCVPOST_BUF_SIZE
+        * in length, so the firstfrag is large enough to hold 1514.
+        */
+       skb = alloc_skb(RCVPOST_BUF_SIZE, GFP_ATOMIC);
+       if (!skb)
+               return NULL;
+       skb->dev = netdev;
+       skb->len = RCVPOST_BUF_SIZE;
+       /* current value of mtu doesn't come into play here; large
+        * packets will just end up using multiple rcv buffers all of
+        * same size
+        */
+       skb->data_len = 0;      /* dev_alloc_skb already zeroes it out
+                                * for clarification.
+                                */
+       return skb;
+}
+
+/**
+ *     post_skb        - post a skb to the IO Partition.
+ *     @cmdrsp: cmdrsp packet to be send to the IO Partition
+ *     @devdata: visornic_devdata to post the skb too
+ *     @skb: skb to give to the IO partition
+ *
+ *     Send the skb to the IO Partition.
+ *     Returns void
+ */
+static inline void
+post_skb(struct uiscmdrsp *cmdrsp,
+        struct visornic_devdata *devdata, struct sk_buff *skb)
+{
+       cmdrsp->net.buf = skb;
+       cmdrsp->net.rcvpost.frag.pi_pfn = page_to_pfn(virt_to_page(skb->data));
+       cmdrsp->net.rcvpost.frag.pi_off =
+               (unsigned long)skb->data & PI_PAGE_MASK;
+       cmdrsp->net.rcvpost.frag.pi_len = skb->len;
+       cmdrsp->net.rcvpost.unique_num = devdata->uniquenum;
+
+       if ((cmdrsp->net.rcvpost.frag.pi_off + skb->len) <= PI_PAGE_SIZE) {
+               cmdrsp->net.type = NET_RCV_POST;
+               cmdrsp->cmdtype = CMD_NET_TYPE;
+               visorchannel_signalinsert(devdata->dev->visorchannel,
+                                         IOCHAN_TO_IOPART,
+                                         cmdrsp);
+               atomic_inc(&devdata->num_rcvbuf_in_iovm);
+               devdata->chstat.sent_post++;
+       }
+}
+
+/**
+ *     send_enbdis     - send NET_RCV_ENBDIS to IO Partition
+ *     @netdev: netdevice we are enable/disable, used as context
+ *              return value
+ *     @state: enable = 1/disable = 0
+ *     @devdata: visornic device we are enabling/disabling
+ *
+ *     Send the enable/disable message to the IO Partition.
+ *     Returns void
+ */
+static void
+send_enbdis(struct net_device *netdev, int state,
+           struct visornic_devdata *devdata)
+{
+       devdata->cmdrsp_rcv->net.enbdis.enable = state;
+       devdata->cmdrsp_rcv->net.enbdis.context = netdev;
+       devdata->cmdrsp_rcv->net.type = NET_RCV_ENBDIS;
+       devdata->cmdrsp_rcv->cmdtype = CMD_NET_TYPE;
+       visorchannel_signalinsert(devdata->dev->visorchannel,
+                                 IOCHAN_TO_IOPART,
+                                 devdata->cmdrsp_rcv);
+       devdata->chstat.sent_enbdis++;
+}
+
+/**
+ *     visornic_disable_with_timeout - Disable network adapter
+ *     @netdev: netdevice to disale
+ *     @timeout: timeout to wait for disable
+ *
+ *     Disable the network adapter and inform the IO Partition that we
+ *     are disabled, reclaim memory from rcv bufs.
+ *     Returns 0 on success, negative for failure of IO Partition
+ *     responding.
+ *
+ */
+static int
+visornic_disable_with_timeout(struct net_device *netdev, const int timeout)
+{
+       struct visornic_devdata *devdata = netdev_priv(netdev);
+       int i;
+       unsigned long flags;
+       int wait = 0;
+
+       /* stop the transmit queue so nothing more can be transmitted */
+       netif_stop_queue(netdev);
+
+       /* send a msg telling the other end we are stopping incoming pkts */
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       devdata->enabled = 0;
+       devdata->enab_dis_acked = 0; /* must wait for ack */
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       /* send disable and wait for ack -- don't hold lock when sending
+        * disable because if the queue is full, insert might sleep.
+        */
+       send_enbdis(netdev, 0, devdata);
+
+       /* wait for ack to arrive before we try to free rcv buffers
+        * NOTE: the other end automatically unposts the rcv buffers when
+        * when it gets a disable.
+        */
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       while ((timeout == VISORNIC_INFINITE_RESPONSE_WAIT) ||
+              (wait < timeout)) {
+               if (devdata->enab_dis_acked)
+                       break;
+               if (devdata->server_down || devdata->server_change_state) {
+                       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+                       return -EIO;
+               }
+               set_current_state(TASK_INTERRUPTIBLE);
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               wait += schedule_timeout(msecs_to_jiffies(10));
+               spin_lock_irqsave(&devdata->priv_lock, flags);
+       }
+
+       /* Wait for usage to go to 1 (no other users) before freeing
+        * rcv buffers
+        */
+       if (atomic_read(&devdata->usage) > 1) {
+               while (1) {
+                       set_current_state(TASK_INTERRUPTIBLE);
+                       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+                       schedule_timeout(msecs_to_jiffies(10));
+                       spin_lock_irqsave(&devdata->priv_lock, flags);
+                       if (atomic_read(&devdata->usage))
+                               break;
+               }
+       }
+
+       /* we've set enabled to 0, so we can give up the lock. */
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       /* Free rcv buffers - other end has automatically unposed them on
+        * disable
+        */
+       for (i = 0; i < devdata->num_rcv_bufs; i++) {
+               if (devdata->rcvbuf[i]) {
+                       kfree_skb(devdata->rcvbuf[i]);
+                       devdata->rcvbuf[i] = NULL;
+               }
+       }
+
+       /* remove references from array */
+       for (i = 0; i < VISORNICSOPENMAX; i++)
+               if (num_visornic_open[i] == netdev) {
+                       num_visornic_open[i] = NULL;
+                       break;
+               }
+
+       return 0;
+}
+
+/**
+ *     init_rcv_bufs  -- initialize receive bufs and send them to the IO Part
+ *     @netdev: struct netdevice
+ *     @devdata: visornic_devdata
+ *
+ *     Allocate rcv buffers and post them to the IO Partition.
+ *     Return 0 for success, and negative for failure.
+ */
+static int
+init_rcv_bufs(struct net_device *netdev, struct visornic_devdata *devdata)
+{
+       int i, count;
+
+       /* allocate fixed number of receive buffers to post to uisnic
+        * post receive buffers after we've allocated a required amount
+        */
+       for (i = 0; i < devdata->num_rcv_bufs; i++) {
+               devdata->rcvbuf[i] = alloc_rcv_buf(netdev);
+               if (!devdata->rcvbuf[i])
+                       break; /* if we failed to allocate one let us stop */
+       }
+       if (i == 0) /* couldn't even allocate one -- bail out */
+               return -ENOMEM;
+       count = i;
+
+       /* Ensure we can alloc 2/3rd of the requeested number of buffers.
+        * 2/3 is an arbitrary choice; used also in ndis init.c
+        */
+       if (count < ((2 * devdata->num_rcv_bufs) / 3)) {
+               /* free receive buffers we did alloc and then bail out */
+               for (i = 0; i < count; i++) {
+                       kfree_skb(devdata->rcvbuf[i]);
+                       devdata->rcvbuf[i] = NULL;
+               }
+               return -ENOMEM;
+       }
+
+       /* post receive buffers to receive incoming input - without holding
+        * lock - we've not enabled nor started the queue so there shouldn't
+        * be any rcv or xmit activity
+        */
+       for (i = 0; i < count; i++)
+               post_skb(devdata->cmdrsp_rcv, devdata, devdata->rcvbuf[i]);
+
+       return 0;
+}
+
+/**
+ *     visornic_enable_with_timeout    - send enable to IO Part
+ *     @netdev: struct net_device
+ *     @timeout: Time to wait for the ACK from the enable
+ *
+ *     Sends enable to IOVM, inits, and posts receive buffers to IOVM
+ *     timeout is defined in msecs (timeout of 0 specifies infinite wait)
+ *     Return 0 for success, negavite for failure.
+ */
+static int
+visornic_enable_with_timeout(struct net_device *netdev, const int timeout)
+{
+       int i;
+       struct visornic_devdata *devdata = netdev_priv(netdev);
+       unsigned long flags;
+       int wait = 0;
+
+       /* NOTE: the other end automatically unposts the rcv buffers when it
+        * gets a disable.
+        */
+       i = init_rcv_bufs(netdev, devdata);
+       if (i < 0)
+               return i;
+
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       devdata->enabled = 1;
+
+       /* now we're ready, let's send an ENB to uisnic but until we get
+        * an ACK back from uisnic, we'll drop the packets
+        */
+       devdata->n_rcv_packets_not_accepted = 0;
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       /* send enable and wait for ack -- don't hold lock when sending enable
+        * because if the queue is full, insert might sleep.
+        */
+       send_enbdis(netdev, 1, devdata);
+
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       while ((timeout == VISORNIC_INFINITE_RESPONSE_WAIT) ||
+              (wait < timeout)) {
+               if (devdata->enab_dis_acked)
+                       break;
+               if (devdata->server_down || devdata->server_change_state) {
+                       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+                       return -EIO;
+               }
+               set_current_state(TASK_INTERRUPTIBLE);
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               wait += schedule_timeout(msecs_to_jiffies(10));
+               spin_lock_irqsave(&devdata->priv_lock, flags);
+       }
+
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       if (!devdata->enab_dis_acked)
+               return -EIO;
+
+       /* find an open slot in the array to save off VisorNic references
+        * for debug
+        */
+       for (i = 0; i < VISORNICSOPENMAX; i++) {
+               if (!num_visornic_open[i]) {
+                       num_visornic_open[i] = netdev;
+                       break;
+               }
+       }
+
+       return 0;
+}
+
+/**
+ *     visornic_timeout_reset  - handle xmit timeout resets
+ *     @work   work item that scheduled the work
+ *
+ *     Transmit Timeouts are typically handled by resetting the
+ *     device for our virtual NIC we will send a Disable and Enable
+ *     to the IOVM. If it doesn't respond we will trigger a serverdown.
+ */
+static void
+visornic_timeout_reset(struct work_struct *work)
+{
+       struct visornic_devdata *devdata;
+       struct net_device *netdev;
+       int response = 0;
+
+       devdata = container_of(work, struct visornic_devdata, timeout_reset);
+       netdev = devdata->netdev;
+
+       netif_stop_queue(netdev);
+       response = visornic_disable_with_timeout(netdev, 100);
+       if (response)
+               goto call_serverdown;
+
+       response = visornic_enable_with_timeout(netdev, 100);
+       if (response)
+               goto call_serverdown;
+       netif_wake_queue(netdev);
+
+       return;
+
+call_serverdown:
+       visornic_serverdown(devdata);
+}
+
+/**
+ *     visornic_open - Enable the visornic device and mark the queue started
+ *     @netdev: netdevice to start
+ *
+ *      Enable the device and start the transmit queue.
+ *      Return 0 for success
+ */
+static int
+visornic_open(struct net_device *netdev)
+{
+       visornic_enable_with_timeout(netdev, VISORNIC_INFINITE_RESPONSE_WAIT);
+
+       /* start the interface's transmit queue, allowing it to accept
+        * packets for transmission
+        */
+       netif_start_queue(netdev);
+
+       return 0;
+}
+
+/**
+ *     visornic_close - Disables the visornic device and stops the queues
+ *     @netdev: netdevice to start
+ *
+ *      Disable the device and stop the transmit queue.
+ *      Return 0 for success
+ */
+static int
+visornic_close(struct net_device *netdev)
+{
+       netif_stop_queue(netdev);
+       visornic_disable_with_timeout(netdev, VISORNIC_INFINITE_RESPONSE_WAIT);
+
+       return 0;
+}
+
+/**
+ *     visornic_xmit - send a packet to the IO Partition
+ *     @skb: Packet to be sent
+ *     @netdev: net device the packet is being sent from
+ *
+ *     Convert the skb to a cmdrsp so the IO Partition can undersand it.
+ *     Send the XMIT command to the IO Partition for processing. This
+ *     function is protected from concurrent calls by a spinlock xmit_lock
+ *     in the net_device struct, but as soon as the function returns it
+ *     can be called again.
+ *     Returns NETDEV_TX_OK for success, NETDEV_TX_BUSY for error.
+ */
+static int
+visornic_xmit(struct sk_buff *skb, struct net_device *netdev)
+{
+       struct visornic_devdata *devdata;
+       int len, firstfraglen, padlen;
+       struct uiscmdrsp *cmdrsp = NULL;
+       unsigned long flags;
+
+       devdata = netdev_priv(netdev);
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+
+       if (netif_queue_stopped(netdev) || devdata->server_down ||
+           devdata->server_change_state) {
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               devdata->busy_cnt++;
+               return NETDEV_TX_BUSY;
+       }
+
+       /* sk_buff struct is used to host network data throughout all the
+        * linux network subsystems
+        */
+       len = skb->len;
+
+       /* skb->len is the FULL length of data (including fragmentary portion)
+        * skb->data_len is the length of the fragment portion in frags
+        * skb->len - skb->data_len is size of the 1st fragment in skb->data
+        * calculate the length of the first fragment that skb->data is
+        * pointing to
+        */
+       firstfraglen = skb->len - skb->data_len;
+       if (firstfraglen < ETH_HEADER_SIZE) {
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               devdata->busy_cnt++;
+               return NETDEV_TX_BUSY;
+       }
+
+       if ((len < ETH_MIN_PACKET_SIZE) &&
+           ((skb_end_pointer(skb) - skb->data) >= ETH_MIN_PACKET_SIZE)) {
+               /* pad the packet out to minimum size */
+               padlen = ETH_MIN_PACKET_SIZE - len;
+               memset(&skb->data[len], 0, padlen);
+               skb->tail += padlen;
+               skb->len += padlen;
+               len += padlen;
+               firstfraglen += padlen;
+       }
+
+       cmdrsp = devdata->xmit_cmdrsp;
+       /* clear cmdrsp */
+       memset(cmdrsp, 0, SIZEOF_CMDRSP);
+       cmdrsp->net.type = NET_XMIT;
+       cmdrsp->cmdtype = CMD_NET_TYPE;
+
+       /* save the pointer to skb -- we'll need it for completion */
+       cmdrsp->net.buf = skb;
+
+       if (((devdata->chstat.sent_xmit >= devdata->chstat.got_xmit_done) &&
+            (devdata->chstat.sent_xmit - devdata->chstat.got_xmit_done >=
+            devdata->max_outstanding_net_xmits)) ||
+            ((devdata->chstat.sent_xmit < devdata->chstat.got_xmit_done) &&
+            (ULONG_MAX - devdata->chstat.got_xmit_done +
+             devdata->chstat.sent_xmit >=
+             devdata->max_outstanding_net_xmits))) {
+               /* too many NET_XMITs queued over to IOVM - need to wait
+                */
+               devdata->chstat.reject_count++;
+               if (!devdata->queuefullmsg_logged &&
+                   ((devdata->chstat.reject_count & 0x3ff) == 1))
+                       devdata->queuefullmsg_logged = 1;
+               netif_stop_queue(netdev);
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               devdata->busy_cnt++;
+               return NETDEV_TX_BUSY;
+       }
+       if (devdata->queuefullmsg_logged)
+               devdata->queuefullmsg_logged = 0;
+
+       if (skb->ip_summed == CHECKSUM_UNNECESSARY) {
+               cmdrsp->net.xmt.lincsum.valid = 1;
+               cmdrsp->net.xmt.lincsum.protocol = skb->protocol;
+               if (skb_transport_header(skb) > skb->data) {
+                       cmdrsp->net.xmt.lincsum.hrawoff =
+                               skb_transport_header(skb) - skb->data;
+                       cmdrsp->net.xmt.lincsum.hrawoff = 1;
+               }
+               if (skb_network_header(skb) > skb->data) {
+                       cmdrsp->net.xmt.lincsum.nhrawoff =
+                               skb_network_header(skb) - skb->data;
+                       cmdrsp->net.xmt.lincsum.nhrawoffv = 1;
+               }
+               cmdrsp->net.xmt.lincsum.csum = skb->csum;
+       } else {
+               cmdrsp->net.xmt.lincsum.valid = 0;
+       }
+
+       /* save off the length of the entire data packet */
+       cmdrsp->net.xmt.len = len;
+
+       /* copy ethernet header from first frag into ocmdrsp
+        * - everything else will be pass in frags & DMA'ed
+        */
+       memcpy(cmdrsp->net.xmt.ethhdr, skb->data, ETH_HEADER_SIZE);
+       /* copy frags info - from skb->data we need to only provide access
+        * beyond eth header
+        */
+       cmdrsp->net.xmt.num_frags =
+               visor_copy_fragsinfo_from_skb(skb, firstfraglen,
+                                             MAX_PHYS_INFO,
+                                             cmdrsp->net.xmt.frags);
+       if (cmdrsp->net.xmt.num_frags == -1) {
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               devdata->busy_cnt++;
+               return NETDEV_TX_BUSY;
+       }
+
+       if (!visorchannel_signalinsert(devdata->dev->visorchannel,
+                                      IOCHAN_TO_IOPART, cmdrsp)) {
+               netif_stop_queue(netdev);
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               devdata->busy_cnt++;
+               return NETDEV_TX_BUSY;
+       }
+
+       /* Track the skbs that have been sent to the IOVM for XMIT */
+       skb_queue_head(&devdata->xmitbufhead, skb);
+
+       /* set the last transmission start time
+        * linux doc says: Do not forget to update netdev->trans_start to
+        * jiffies after each new tx packet is given to the hardware.
+        */
+       netdev->trans_start = jiffies;
+
+       /* update xmt stats */
+       devdata->net_stats.tx_packets++;
+       devdata->net_stats.tx_bytes += skb->len;
+       devdata->chstat.sent_xmit++;
+
+       /* check to see if we have hit the high watermark for
+        * netif_stop_queue()
+        */
+       if (((devdata->chstat.sent_xmit >= devdata->chstat.got_xmit_done) &&
+            (devdata->chstat.sent_xmit - devdata->chstat.got_xmit_done >=
+             devdata->upper_threshold_net_xmits)) ||
+           ((devdata->chstat.sent_xmit < devdata->chstat.got_xmit_done) &&
+            (ULONG_MAX - devdata->chstat.got_xmit_done +
+             devdata->chstat.sent_xmit >=
+             devdata->upper_threshold_net_xmits))) {
+               /* too many NET_XMITs queued over to IOVM - need to wait */
+               netif_stop_queue(netdev); /* calling stop queue - call
+                                          * netif_wake_queue() after lower
+                                          * threshold
+                                          */
+               devdata->flow_control_upper_hits++;
+       }
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       /* skb will be freed when we get back NET_XMIT_DONE */
+       return NETDEV_TX_OK;
+}
+
+/**
+ *     visornic_get_stats - returns net_stats of the visornic device
+ *     @netdev: netdevice
+ *
+ *     Returns the net_device_stats for the device
+ */
+static struct net_device_stats *
+visornic_get_stats(struct net_device *netdev)
+{
+       struct visornic_devdata *devdata = netdev_priv(netdev);
+
+       return &devdata->net_stats;
+}
+
+/**
+ *     visornic_ioctl - ioctl function for netdevice.
+ *     @netdev: netdevice
+ *     @ifr: ignored
+ *     @cmd: ignored
+ *
+ *     Currently not supported.
+ *     Returns EOPNOTSUPP
+ */
+static int
+visornic_ioctl(struct net_device *netdev, struct ifreq *ifr, int cmd)
+{
+       return -EOPNOTSUPP;
+}
+
+/**
+ *     visornic_change_mtu - changes mtu of device.
+ *     @netdev: netdevice
+ *     @new_mtu: value of new mtu
+ *
+ *     MTU cannot be changed by system, must be changed via
+ *     CONTROLVM message. All vnics and pnics in a switch have
+ *     to have the same MTU for everything to work.
+ *     Currently not supported.
+ *     Returns EINVAL
+ */
+static int
+visornic_change_mtu(struct net_device *netdev, int new_mtu)
+{
+       return -EINVAL;
+}
+
+/**
+ *     visornic_set_multi - changes mtu of device.
+ *     @netdev: netdevice
+ *
+ *     Only flag we support currently is IFF_PROMISC
+ *     Returns void
+ */
+static void
+visornic_set_multi(struct net_device *netdev)
+{
+       struct uiscmdrsp *cmdrsp;
+       struct visornic_devdata *devdata = netdev_priv(netdev);
+
+       /* any filtering changes */
+       if (devdata->old_flags != netdev->flags) {
+               if ((netdev->flags & IFF_PROMISC) !=
+                   (devdata->old_flags & IFF_PROMISC)) {
+                       cmdrsp = kmalloc(SIZEOF_CMDRSP, GFP_ATOMIC);
+                       if (!cmdrsp)
+                               return;
+                       cmdrsp->cmdtype = CMD_NET_TYPE;
+                       cmdrsp->net.type = NET_RCV_PROMISC;
+                       cmdrsp->net.enbdis.context = netdev;
+                       cmdrsp->net.enbdis.enable =
+                               (netdev->flags & IFF_PROMISC);
+                       visorchannel_signalinsert(devdata->dev->visorchannel,
+                                                 IOCHAN_TO_IOPART,
+                                                 cmdrsp);
+                       kfree(cmdrsp);
+               }
+               devdata->old_flags = netdev->flags;
+       }
+}
+
+/**
+ *     visornic_xmit_timeout - request to timeout the xmit
+ *     @netdev
+ *
+ *     Queue the work and return. Make sure we have not already
+ *     been informed the IO Partition is gone, if it is gone
+ *     we will already timeout the xmits.
+ */
+static void
+visornic_xmit_timeout(struct net_device *netdev)
+{
+       struct visornic_devdata *devdata = netdev_priv(netdev);
+       unsigned long flags;
+
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       /* Ensure that a ServerDown message hasn't been received */
+       if (!devdata->enabled ||
+           (devdata->server_down && !devdata->server_change_state)) {
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               return;
+       }
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       queue_work(visornic_timeout_reset_workqueue, &devdata->timeout_reset);
+}
+
+/**
+ *     repost_return   - repost rcv bufs that have come back
+ *     @cmdrsp: io channel command struct to post
+ *     @devdata: visornic devdata for the device
+ *     @skb: skb
+ *     @netdev: netdevice
+ *
+ *     Repost rcv buffers that have been returned to us when
+ *     we are finished with them.
+ *     Returns 0 for success, -1 for error.
+ */
+static inline int
+repost_return(struct uiscmdrsp *cmdrsp, struct visornic_devdata *devdata,
+             struct sk_buff *skb, struct net_device *netdev)
+{
+       struct net_pkt_rcv copy;
+       int i = 0, cc, numreposted;
+       int found_skb = 0;
+       int status = 0;
+
+       copy = cmdrsp->net.rcv;
+       switch (copy.numrcvbufs) {
+       case 0:
+               devdata->n_rcv0++;
+               break;
+       case 1:
+               devdata->n_rcv1++;
+               break;
+       case 2:
+               devdata->n_rcv2++;
+               break;
+       default:
+               devdata->n_rcvx++;
+               break;
+       }
+       for (cc = 0, numreposted = 0; cc < copy.numrcvbufs; cc++) {
+               for (i = 0; i < devdata->num_rcv_bufs; i++) {
+                       if (devdata->rcvbuf[i] != copy.rcvbuf[cc])
+                               continue;
+
+                       if ((skb) && devdata->rcvbuf[i] == skb) {
+                               devdata->found_repost_rcvbuf_cnt++;
+                               found_skb = 1;
+                               devdata->repost_found_skb_cnt++;
+                       }
+                       devdata->rcvbuf[i] = alloc_rcv_buf(netdev);
+                       if (!devdata->rcvbuf[i]) {
+                               devdata->num_rcv_bufs_could_not_alloc++;
+                               devdata->alloc_failed_in_repost_rtn_cnt++;
+                               status = -ENOMEM;
+                               break;
+                       }
+                       post_skb(cmdrsp, devdata, devdata->rcvbuf[i]);
+                       numreposted++;
+                       break;
+               }
+       }
+       if (numreposted != copy.numrcvbufs) {
+               devdata->n_repost_deficit++;
+               status = -EINVAL;
+       }
+       if (skb) {
+               if (found_skb) {
+                       kfree_skb(skb);
+               } else {
+                       status = -EINVAL;
+                       devdata->bad_rcv_buf++;
+               }
+       }
+       atomic_dec(&devdata->usage);
+       return status;
+}
+
+/**
+ *     visornic_rx - Handle receive packets coming back from IO Part
+ *     @cmdrsp: Receive packet returned from IO Part
+ *
+ *     Got a receive packet back from the IO Part, handle it and send
+ *     it up the stack.
+ *     Returns void
+ */
+static void
+visornic_rx(struct uiscmdrsp *cmdrsp)
+{
+       struct visornic_devdata *devdata;
+       struct sk_buff *skb, *prev, *curr;
+       struct net_device *netdev;
+       int cc, currsize, off, status;
+       struct ethhdr *eth;
+       unsigned long flags;
+#ifdef DEBUG
+       struct phys_info testfrags[MAX_PHYS_INFO];
+#endif
+
+       /* post new rcv buf to the other end using the cmdrsp we have at hand
+        * post it without holding lock - but we'll use the signal lock to
+        * synchronize the queue insert the cmdrsp that contains the net.rcv
+        * is the one we are using to repost, so copy the info we need from it.
+        */
+       skb = cmdrsp->net.buf;
+       netdev = skb->dev;
+
+       if (!netdev) {
+               /* We must have previously downed this network device and
+                * this skb and device is no longer valid. This also means
+                * the skb reference was removed from devdata->rcvbuf so no
+                * need to search for it.
+                * All we can do is free the skb and return.
+                * Note: We crash if we try to log this here.
+                */
+               kfree_skb(skb);
+               return;
+       }
+
+       devdata = netdev_priv(netdev);
+
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       atomic_dec(&devdata->num_rcvbuf_in_iovm);
+
+       /* update rcv stats - call it with priv_lock held */
+       devdata->net_stats.rx_packets++;
+       devdata->net_stats.rx_bytes = skb->len;
+
+       atomic_inc(&devdata->usage);    /* don't want a close to happen before
+                                        *  we're done here
+                                        */
+
+       /* set length to how much was ACTUALLY received -
+        * NOTE: rcv_done_len includes actual length of data rcvd
+        * including ethhdr
+        */
+       skb->len = cmdrsp->net.rcv.rcv_done_len;
+
+       /* test enabled while holding lock */
+       if (!(devdata->enabled && devdata->enab_dis_acked)) {
+               /* don't process it unless we're in enable mode and until
+                * we've gotten an ACK saying the other end got our RCV enable
+                */
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+               repost_return(cmdrsp, devdata, skb, netdev);
+               return;
+       }
+
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+       /* when skb was allocated, skb->dev, skb->data, skb->len and
+        * skb->data_len were setup. AND, data has already put into the
+        * skb (both first frag and in frags pages)
+        * NOTE: firstfragslen is the amount of data in skb->data and that
+        * which is not in nr_frags or frag_list. This is now simply
+        * RCVPOST_BUF_SIZE. bump tail to show how much data is in
+        * firstfrag & set data_len to show rest see if we have to chain
+        * frag_list.
+        */
+       if (skb->len > RCVPOST_BUF_SIZE) {      /* do PRECAUTIONARY check */
+               if (cmdrsp->net.rcv.numrcvbufs < 2) {
+                       if (repost_return(cmdrsp, devdata, skb, netdev) < 0)
+                               dev_err(&devdata->netdev->dev,
+                                       "repost_return failed");
+                       return;
+               }
+               /* length rcvd is greater than firstfrag in this skb rcv buf  */
+               skb->tail += RCVPOST_BUF_SIZE;  /* amount in skb->data */
+               skb->data_len = skb->len - RCVPOST_BUF_SIZE;    /* amount that
+                                                                  will be in
+                                                                  frag_list */
+       } else {
+               /* data fits in this skb - no chaining - do
+                * PRECAUTIONARY check
+                */
+               if (cmdrsp->net.rcv.numrcvbufs != 1) {  /* should be 1 */
+                       if (repost_return(cmdrsp, devdata, skb, netdev) < 0)
+                               dev_err(&devdata->netdev->dev,
+                                       "repost_return failed");
+                       return;
+               }
+               skb->tail += skb->len;
+               skb->data_len = 0;      /* nothing rcvd in frag_list */
+       }
+       off = skb_tail_pointer(skb) - skb->data;
+
+       /* amount we bumped tail by in the head skb
+        * it is used to calculate the size of each chained skb below
+        * it is also used to index into bufline to continue the copy
+        * (for chansocktwopc)
+        * if necessary chain the rcv skbs together.
+        * NOTE: index 0 has the same as cmdrsp->net.rcv.skb; we need to
+        * chain the rest to that one.
+        * - do PRECAUTIONARY check
+        */
+       if (cmdrsp->net.rcv.rcvbuf[0] != skb) {
+               if (repost_return(cmdrsp, devdata, skb, netdev) < 0)
+                       dev_err(&devdata->netdev->dev, "repost_return failed");
+               return;
+       }
+
+       if (cmdrsp->net.rcv.numrcvbufs > 1) {
+               /* chain the various rcv buffers into the skb's frag_list. */
+               /* Note: off was initialized above  */
+               for (cc = 1, prev = NULL;
+                    cc < cmdrsp->net.rcv.numrcvbufs; cc++) {
+                       curr = (struct sk_buff *)cmdrsp->net.rcv.rcvbuf[cc];
+                       curr->next = NULL;
+                       if (!prev)      /* start of list- set head */
+                               skb_shinfo(skb)->frag_list = curr;
+                       else
+                               prev->next = curr;
+                       prev = curr;
+
+                       /* should we set skb->len and skb->data_len for each
+                        * buffer being chained??? can't hurt!
+                        */
+                       currsize = min(skb->len - off,
+                                      (unsigned int)RCVPOST_BUF_SIZE);
+                       curr->len = currsize;
+                       curr->tail += currsize;
+                       curr->data_len = 0;
+                       off += currsize;
+               }
+#ifdef DEBUG
+               /* assert skb->len == off */
+               if (skb->len != off) {
+                       dev_err(&devdata->netdev->dev,
+                               "%s something wrong; skb->len:%d != off:%d\n",
+                               netdev->name, skb->len, off);
+               }
+               /* test code */
+               cc = util_copy_fragsinfo_from_skb("rcvchaintest", skb,
+                                                 RCVPOST_BUF_SIZE,
+                                                 MAX_PHYS_INFO, testfrags);
+               if (cc != cmdrsp->net.rcv.numrcvbufs) {
+                       dev_err(&devdata->netdev->dev,
+                               "**** %s Something wrong; rcvd chain length %d different from one we calculated %d\n",
+                               netdev->name, cmdrsp->net.rcv.numrcvbufs, cc);
+               }
+               for (i = 0; i < cc; i++) {
+                       dev_inf(&devdata->netdev->dev,
+                               "test:RCVPOST_BUF_SIZE:%d[%d] pfn:%llu off:0x%x len:%d\n",
+                               RCVPOST_BUF_SIZE, i, testfrags[i].pi_pfn,
+                               testfrags[i].pi_off, testfrags[i].pi_len);
+               }
+#endif
+       }
+
+       /* set up packet's protocl type using ethernet header - this
+        * sets up skb->pkt_type & it also PULLS out the eth header
+        */
+       skb->protocol = eth_type_trans(skb, netdev);
+
+       eth = eth_hdr(skb);
+
+       skb->csum = 0;
+       skb->ip_summed = CHECKSUM_NONE;
+
+       do {
+               if (netdev->flags & IFF_PROMISC)
+                       break;  /* accept all packets */
+               if (skb->pkt_type == PACKET_BROADCAST) {
+                       if (netdev->flags & IFF_BROADCAST)
+                               break;  /* accept all broadcast packets */
+               } else if (skb->pkt_type == PACKET_MULTICAST) {
+                       if ((netdev->flags & IFF_MULTICAST) &&
+                           (netdev_mc_count(netdev))) {
+                               struct netdev_hw_addr *ha;
+                               int found_mc = 0;
+
+                               /* only accept multicast packets that we can
+                                * find in our multicast address list
+                                */
+                               netdev_for_each_mc_addr(ha, netdev) {
+                                       if (ether_addr_equal(eth->h_dest,
+                                                            ha->addr)) {
+                                               found_mc = 1;
+                                               break;
+                                       }
+                               }
+                               if (found_mc)
+                                       break;  /* accept packet, dest
+                                                  matches a multicast
+                                                  address */
+                       }
+               } else if (skb->pkt_type == PACKET_HOST) {
+                       break;  /* accept packet, h_dest must match vnic
+                                  mac address */
+               } else if (skb->pkt_type == PACKET_OTHERHOST) {
+                       /* something is not right */
+                       dev_err(&devdata->netdev->dev,
+                               "**** FAILED to deliver rcv packet to OS; name:%s Dest:%pM VNIC:%pM\n",
+                               netdev->name, eth->h_dest, netdev->dev_addr);
+               }
+               /* drop packet - don't forward it up to OS */
+               devdata->n_rcv_packets_not_accepted++;
+               repost_return(cmdrsp, devdata, skb, netdev);
+               return;
+       } while (0);
+
+       status = netif_rx(skb);
+       /* netif_rx returns various values, but "in practice most drivers
+        * ignore the return value
+        */
+
+       skb = NULL;
+       /*
+        * whether the packet got dropped or handled, the skb is freed by
+        * kernel code, so we shouldn't free it. but we should repost a
+        * new rcv buffer.
+        */
+       repost_return(cmdrsp, devdata, skb, netdev);
+}
+
+/**
+ *     devdata_initialize      - Initialize devdata structure
+ *     @devdata: visornic_devdata structure to initialize
+ *     #dev: visorbus_deviced it belongs to
+ *
+ *     Setup initial values for the visornic based on channel and default
+ *     values.
+ *     Returns a pointer to the devdata if successful, else NULL
+ */
+static struct visornic_devdata *
+devdata_initialize(struct visornic_devdata *devdata, struct visor_device *dev)
+{
+       int devnum = -1;
+
+       if (!devdata)
+               return NULL;
+       memset(devdata, '\0', sizeof(struct visornic_devdata));
+       spin_lock(&dev_num_pool_lock);
+       devnum = find_first_zero_bit(dev_num_pool, MAXDEVICES);
+       set_bit(devnum, dev_num_pool);
+       spin_unlock(&dev_num_pool_lock);
+       if (devnum == MAXDEVICES)
+               devnum = -1;
+       if (devnum < 0) {
+               kfree(devdata);
+               return NULL;
+       }
+       devdata->devnum = devnum;
+       devdata->dev = dev;
+       strncpy(devdata->name, dev_name(&dev->device), sizeof(devdata->name));
+       kref_init(&devdata->kref);
+       spin_lock(&lock_all_devices);
+       list_add_tail(&devdata->list_all, &list_all_devices);
+       spin_unlock(&lock_all_devices);
+       return devdata;
+}
+
+/**
+ *     devdata_release - Frees up a devdata
+ *     @mykref: kref to the devdata
+ *
+ *     Frees up a devdata.
+ *     Returns void
+ */
+static void devdata_release(struct kref *mykref)
+{
+       struct visornic_devdata *devdata =
+               container_of(mykref, struct visornic_devdata, kref);
+
+       spin_lock(&dev_num_pool_lock);
+       clear_bit(devdata->devnum, dev_num_pool);
+       spin_unlock(&dev_num_pool_lock);
+       spin_lock(&lock_all_devices);
+       list_del(&devdata->list_all);
+       spin_unlock(&lock_all_devices);
+       kfree(devdata);
+}
+
+static const struct net_device_ops visornic_dev_ops = {
+       .ndo_open = visornic_open,
+       .ndo_stop = visornic_close,
+       .ndo_start_xmit = visornic_xmit,
+       .ndo_get_stats = visornic_get_stats,
+       .ndo_do_ioctl = visornic_ioctl,
+       .ndo_change_mtu = visornic_change_mtu,
+       .ndo_tx_timeout = visornic_xmit_timeout,
+       .ndo_set_rx_mode = visornic_set_multi,
+};
+
+/**
+ *     send_rcv_posts_if_needed
+ *     @devdata: visornic device
+ *
+ *     Send receive buffers to the IO Partition.
+ *     Returns void
+ */
+static void
+send_rcv_posts_if_needed(struct visornic_devdata *devdata)
+{
+       int i;
+       struct net_device *netdev;
+       struct uiscmdrsp *cmdrsp = devdata->cmdrsp_rcv;
+       int cur_num_rcv_bufs_to_alloc, rcv_bufs_allocated;
+
+       /* don't do this until vnic is marked ready */
+       if (!(devdata->enabled && devdata->enab_dis_acked))
+               return;
+
+       netdev = devdata->netdev;
+       rcv_bufs_allocated = 0;
+       /* this code is trying to prevent getting stuck here forever,
+        * but still retry it if you cant allocate them all this time.
+        */
+       cur_num_rcv_bufs_to_alloc = devdata->num_rcv_bufs_could_not_alloc;
+       while (cur_num_rcv_bufs_to_alloc > 0) {
+               cur_num_rcv_bufs_to_alloc--;
+               for (i = 0; i < devdata->num_rcv_bufs; i++) {
+                       if (devdata->rcvbuf[i])
+                               continue;
+                       devdata->rcvbuf[i] = alloc_rcv_buf(netdev);
+                       if (!devdata->rcvbuf[i]) {
+                               devdata->alloc_failed_in_if_needed_cnt++;
+                               break;
+                       }
+                       rcv_bufs_allocated++;
+                       post_skb(cmdrsp, devdata, devdata->rcvbuf[i]);
+                       devdata->chstat.extra_rcvbufs_sent++;
+               }
+       }
+       devdata->num_rcv_bufs_could_not_alloc -= rcv_bufs_allocated;
+}
+
+/**
+ *     draing_queue    - drains the response queue
+ *     @cmdrsp: io channel command response message
+ *     @devdata: visornic device to drain
+ *
+ *     Drain the respones queue of any responses from the IO partition.
+ *     Process the responses as we get them.
+ *     Returns when response queue is empty or when the threadd stops.
+ */
+static void
+drain_queue(struct uiscmdrsp *cmdrsp, struct visornic_devdata *devdata)
+{
+       unsigned long flags;
+       struct net_device *netdev;
+
+       /* drain queue */
+       while (1) {
+               /* TODO: CLIENT ACQUIRE -- Don't really need this at the
+                * moment */
+               if (!visorchannel_signalremove(devdata->dev->visorchannel,
+                                              IOCHAN_FROM_IOPART,
+                                              cmdrsp))
+                       break; /* queue empty */
+
+               switch (cmdrsp->net.type) {
+               case NET_RCV:
+                       devdata->chstat.got_rcv++;
+                       /* process incoming packet */
+                       visornic_rx(cmdrsp);
+                       break;
+               case NET_XMIT_DONE:
+                       spin_lock_irqsave(&devdata->priv_lock, flags);
+                       devdata->chstat.got_xmit_done++;
+                       if (cmdrsp->net.xmtdone.xmt_done_result)
+                               devdata->chstat.xmit_fail++;
+                       /* only call queue wake if we stopped it */
+                       netdev = ((struct sk_buff *)cmdrsp->net.buf)->dev;
+                       /* ASSERT netdev == vnicinfo->netdev; */
+                       if ((netdev == devdata->netdev) &&
+                           netif_queue_stopped(netdev)) {
+                               /* check to see if we have crossed
+                                * the lower watermark for
+                                * netif_wake_queue()
+                                */
+                               if (((devdata->chstat.sent_xmit >=
+                                   devdata->chstat.got_xmit_done) &&
+                                   (devdata->chstat.sent_xmit -
+                                   devdata->chstat.got_xmit_done <=
+                                   devdata->lower_threshold_net_xmits)) ||
+                                   ((devdata->chstat.sent_xmit <
+                                   devdata->chstat.got_xmit_done) &&
+                                   (ULONG_MAX - devdata->chstat.got_xmit_done
+                                   + devdata->chstat.sent_xmit <=
+                                   devdata->lower_threshold_net_xmits))) {
+                                       /* enough NET_XMITs completed
+                                        * so can restart netif queue
+                                        */
+                                       netif_wake_queue(netdev);
+                                       devdata->flow_control_lower_hits++;
+                               }
+                       }
+                       skb_unlink(cmdrsp->net.buf, &devdata->xmitbufhead);
+                       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+                       kfree_skb(cmdrsp->net.buf);
+                       break;
+               case NET_RCV_ENBDIS_ACK:
+                       devdata->chstat.got_enbdisack++;
+                       netdev = (struct net_device *)
+                       cmdrsp->net.enbdis.context;
+                       spin_lock_irqsave(&devdata->priv_lock, flags);
+                       devdata->enab_dis_acked = 1;
+                       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+                       if (devdata->server_down &&
+                           devdata->server_change_state) {
+                               /* Inform Linux that the link is up */
+                               devdata->server_down = false;
+                               devdata->server_change_state = false;
+                               netif_wake_queue(netdev);
+                               netif_carrier_on(netdev);
+                       }
+                       break;
+               case NET_CONNECT_STATUS:
+                       netdev = devdata->netdev;
+                       if (cmdrsp->net.enbdis.enable == 1) {
+                               spin_lock_irqsave(&devdata->priv_lock, flags);
+                               devdata->enabled = cmdrsp->net.enbdis.enable;
+                               spin_unlock_irqrestore(&devdata->priv_lock,
+                                                      flags);
+                               netif_wake_queue(netdev);
+                               netif_carrier_on(netdev);
+                       } else {
+                               netif_stop_queue(netdev);
+                               netif_carrier_off(netdev);
+                               spin_lock_irqsave(&devdata->priv_lock, flags);
+                               devdata->enabled = cmdrsp->net.enbdis.enable;
+                               spin_unlock_irqrestore(&devdata->priv_lock,
+                                                      flags);
+                       }
+                       break;
+               default:
+                       break;
+               }
+               /* cmdrsp is now available for reuse  */
+
+               if (kthread_should_stop())
+                       break;
+       }
+}
+
+/**
+ *     process_incoming_rsps   - Checks the status of the response queue.
+ *     @v: void pointer to the visronic devdata
+ *
+ *     Main function of the vnic_incoming thread. Peridocially check the
+ *     response queue and drain it if needed.
+ *     Returns when thread has stopped.
+ */
+static int
+process_incoming_rsps(void *v)
+{
+       struct visornic_devdata *devdata = v;
+       struct uiscmdrsp *cmdrsp = NULL;
+       const int SZ = SIZEOF_CMDRSP;
+
+       cmdrsp = kmalloc(SZ, GFP_ATOMIC);
+       if (!cmdrsp)
+               complete_and_exit(&devdata->threadinfo.has_stopped, 0);
+
+       while (1) {
+               wait_event_interruptible_timeout(
+                       devdata->rsp_queue, (atomic_read(
+                                            &devdata->interrupt_rcvd) == 1),
+                               msecs_to_jiffies(devdata->thread_wait_ms));
+
+               /* periodically check to see if there are any rcf bufs which
+                * need to get sent to the IOSP. This can only happen if
+                * we run out of memory when trying to allocate skbs.
+                */
+               atomic_set(&devdata->interrupt_rcvd, 0);
+               send_rcv_posts_if_needed(devdata);
+               drain_queue(cmdrsp, devdata);
+               if (kthread_should_stop())
+                       break;
+       }
+
+       kfree(cmdrsp);
+       complete_and_exit(&devdata->threadinfo.has_stopped, 0);
+}
+
+/**
+ *     visornic_probe  - probe function for visornic devices
+ *     @dev: The visor device discovered
+ *
+ *     Called when visorbus discovers a visornic device on its
+ *     bus. It creates a new visornic ethernet adapter.
+ *     Returns 0 or negative for error.
+ */
+static int visornic_probe(struct visor_device *dev)
+{
+       struct visornic_devdata *devdata = NULL;
+       struct net_device *netdev = NULL;
+       int err;
+       int channel_offset = 0;
+       u64 features;
+
+       netdev = alloc_etherdev(sizeof(struct visornic_devdata));
+       if (!netdev)
+               return -ENOMEM;
+
+       netdev->netdev_ops = &visornic_dev_ops;
+       netdev->watchdog_timeo = (5 * HZ);
+       netdev->dev.parent = &dev->device;
+
+       /* Get MAC adddress from channel and read it into the device. */
+       netdev->addr_len = ETH_ALEN;
+       channel_offset = offsetof(struct spar_io_channel_protocol,
+                                 vnic.macaddr);
+       err = visorbus_read_channel(dev, channel_offset, netdev->dev_addr,
+                                   ETH_ALEN);
+       if (err < 0)
+               goto cleanup_netdev;
+
+       devdata = devdata_initialize(netdev_priv(netdev), dev);
+       if (!devdata) {
+               err = -ENOMEM;
+               goto cleanup_netdev;
+       }
+
+       devdata->netdev = netdev;
+       init_waitqueue_head(&devdata->rsp_queue);
+       spin_lock_init(&devdata->priv_lock);
+       devdata->enabled = 0; /* not yet */
+       atomic_set(&devdata->usage, 1);
+
+       /* Setup rcv bufs */
+       channel_offset = offsetof(struct spar_io_channel_protocol,
+                                 vnic.num_rcv_bufs);
+       err = visorbus_read_channel(dev, channel_offset,
+                                   &devdata->num_rcv_bufs, 4);
+       if (err)
+               goto cleanup_netdev;
+
+       devdata->rcvbuf = kmalloc(sizeof(struct sk_buff *) *
+                                 devdata->num_rcv_bufs, GFP_KERNEL);
+       if (!devdata->rcvbuf) {
+               err = -ENOMEM;
+               goto cleanup_rcvbuf;
+       }
+
+       /* set the net_xmit outstanding threshold */
+       /* always leave two slots open but you should have 3 at a minimum */
+       devdata->max_outstanding_net_xmits =
+               max(3, ((devdata->num_rcv_bufs / 3) - 2));
+       devdata->upper_threshold_net_xmits =
+               max(2, devdata->max_outstanding_net_xmits - 1);
+       devdata->lower_threshold_net_xmits =
+               max(1, devdata->max_outstanding_net_xmits / 2);
+
+       skb_queue_head_init(&devdata->xmitbufhead);
+
+       /* create a cmdrsp we can use to post and unpost rcv buffers */
+       devdata->cmdrsp_rcv = kmalloc(SIZEOF_CMDRSP, GFP_ATOMIC);
+       if (!devdata->cmdrsp_rcv) {
+               err = -ENOMEM;
+               goto cleanup_cmdrsp_rcv;
+       }
+       devdata->xmit_cmdrsp = kmalloc(SIZEOF_CMDRSP, GFP_ATOMIC);
+       if (!devdata->xmit_cmdrsp) {
+               err = -ENOMEM;
+               goto cleanup_xmit_cmdrsp;
+       }
+       INIT_WORK(&devdata->serverdown_completion,
+                 visornic_serverdown_complete);
+       INIT_WORK(&devdata->timeout_reset, visornic_timeout_reset);
+       devdata->server_down = false;
+       devdata->server_change_state = false;
+
+       /*set the default mtu */
+       channel_offset = offsetof(struct spar_io_channel_protocol,
+                                 vnic.mtu);
+       err = visorbus_read_channel(dev, channel_offset, &netdev->mtu, 4);
+       if (err)
+               goto cleanup_xmit_cmdrsp;
+
+       /* TODO: Setup Interrupt information */
+       /* Let's start our threads to get responses */
+       channel_offset = offsetof(struct spar_io_channel_protocol,
+                                 channel_header.features);
+       err = visorbus_read_channel(dev, channel_offset, &features, 8);
+       if (err)
+               goto cleanup_xmit_cmdrsp;
+
+       features |= ULTRA_IO_CHANNEL_IS_POLLING;
+       err = visorbus_write_channel(dev, channel_offset, &features, 8);
+       if (err)
+               goto cleanup_xmit_cmdrsp;
+
+       devdata->thread_wait_ms = 2;
+       visor_thread_start(&devdata->threadinfo, process_incoming_rsps,
+                          devdata, "vnic_incoming");
+
+       err = register_netdev(netdev);
+       if (err)
+               goto cleanup_thread_stop;
+
+       /* create debgug/sysfs directories */
+       devdata->eth_debugfs_dir = debugfs_create_dir(netdev->name,
+                                                     visornic_debugfs_dir);
+       if (!devdata->eth_debugfs_dir) {
+               err = -ENOMEM;
+               goto cleanup_thread_stop;
+       }
+
+       return 0;
+
+cleanup_thread_stop:
+       visor_thread_stop(&devdata->threadinfo);
+
+cleanup_xmit_cmdrsp:
+       kfree(devdata->xmit_cmdrsp);
+
+cleanup_cmdrsp_rcv:
+       kfree(devdata->cmdrsp_rcv);
+
+cleanup_rcvbuf:
+       kfree(devdata->rcvbuf);
+
+cleanup_netdev:
+       free_netdev(netdev);
+       return err;
+}
+
+/**
+ *     host_side_disappeared   - IO part is gone.
+ *     @devdata: device object
+ *
+ *     IO partition servicing this device is gone, do cleanup
+ *     Returns void.
+ */
+static void host_side_disappeared(struct visornic_devdata *devdata)
+{
+       unsigned long flags;
+
+       spin_lock_irqsave(&devdata->priv_lock, flags);
+       sprintf(devdata->name, "<dev#%d-history>", devdata->devnum);
+       devdata->dev = NULL;   /* indicate device destroyed */
+       spin_unlock_irqrestore(&devdata->priv_lock, flags);
+}
+
+/**
+ *     visornic_remove         - Called when visornic dev goes away
+ *     @dev: visornic device that is being removed
+ *
+ *     Called when DEVICE_DESTROY gets called to remove device.
+ *     Returns void
+ */
+static void visornic_remove(struct visor_device *dev)
+{
+       struct visornic_devdata *devdata = dev_get_drvdata(&dev->device);
+
+       if (!devdata)
+               return;
+       dev_set_drvdata(&dev->device, NULL);
+       host_side_disappeared(devdata);
+       kref_put(&devdata->kref, devdata_release);
+}
+
+/**
+ *     visornic_pause          - Called when IO Part disappears
+ *     @dev: visornic device that is being serviced
+ *     @complete_func: call when finished.
+ *
+ *     Called when the IO Partition has gone down. Need to free
+ *     up resources and wait for IO partition to come back. Mark
+ *     link as down and don't attempt any DMA. When we have freed
+ *     memory call the complete_func so that Command knows we are
+ *     done. If we don't call complete_func, IO part will never
+ *     come back.
+ *     Returns 0 for success.
+ */
+static int visornic_pause(struct visor_device *dev,
+                         visorbus_state_complete_func complete_func)
+{
+       struct visornic_devdata *devdata = dev_get_drvdata(&dev->device);
+
+       visornic_serverdown(devdata);
+       complete_func(dev, 0);
+       return 0;
+}
+
+/**
+ *     visornic_resume         - Called when IO part has recovered
+ *     @dev: visornic device that is being serviced
+ *     @compelte_func: call when finished
+ *
+ *     Called when the IO partition has recovered. Reestablish
+ *     connection to the IO part and set the link up. Okay to do
+ *     DMA again.
+ *     Returns 0 for success.
+ */
+static int visornic_resume(struct visor_device *dev,
+                          visorbus_state_complete_func complete_func)
+{
+       struct visornic_devdata *devdata;
+       struct net_device *netdev;
+       unsigned long flags;
+
+       devdata = dev_get_drvdata(&dev->device);
+       if (!devdata)
+               return -EINVAL;
+
+       netdev = devdata->netdev;
+
+       if (devdata->server_down && !devdata->server_change_state) {
+               devdata->server_change_state = true;
+               /* Must transition channel to ATTACHED state BEFORE
+                * we can start using the device again.
+                * TODO: State transitions
+                */
+               visor_thread_start(&devdata->threadinfo, process_incoming_rsps,
+                                  devdata, "vnic_incoming");
+               init_rcv_bufs(netdev, devdata);
+               spin_lock_irqsave(&devdata->priv_lock, flags);
+               devdata->enabled = 1;
+
+               /* Now we're ready, let's send an ENB to uisnic but until
+                * we get an ACK back from uisnic, we'll drop the packets
+                */
+               devdata->enab_dis_acked = 0;
+               spin_unlock_irqrestore(&devdata->priv_lock, flags);
+
+               /* send enable and wait for ack - don't hold lock when
+                * sending enable because if the queue if sull, insert
+                * might sleep.
+                */
+               send_enbdis(netdev, 1, devdata);
+       } else if (devdata->server_change_state) {
+               return -EIO;
+       }
+
+       complete_func(dev, 0);
+       return 0;
+}
+
+/**
+ *     visornic_init   - Init function
+ *
+ *     Init function for the visornic driver. Do initial driver setup
+ *     and wait for devices.
+ *     Returns 0 for success, negative for error.
+ */
+static int visornic_init(void)
+{
+       struct dentry *ret;
+       int err = -ENOMEM;
+
+       /* create workqueue for serverdown completion */
+       visornic_serverdown_workqueue =
+               create_singlethread_workqueue("visornic_serverdown");
+       if (!visornic_serverdown_workqueue)
+               return -ENOMEM;
+
+       /* create workqueue for tx timeout reset */
+       visornic_timeout_reset_workqueue =
+               create_singlethread_workqueue("visornic_timeout_reset");
+       if (!visornic_timeout_reset_workqueue)
+               return -ENOMEM;
+
+       visornic_debugfs_dir = debugfs_create_dir("visornic", NULL);
+       if (!visornic_debugfs_dir)
+               return err;
+
+       ret = debugfs_create_file("info", S_IRUSR, visornic_debugfs_dir, NULL,
+                                 &debugfs_info_fops);
+       if (!ret)
+               goto cleanup_debugfs;
+       ret = debugfs_create_file("enable_ints", S_IWUSR, visornic_debugfs_dir,
+                                 NULL, &debugfs_enable_ints_fops);
+       if (!ret)
+               goto cleanup_debugfs;
+
+       /* create workqueue for serverdown completion */
+       visornic_serverdown_workqueue =
+               create_singlethread_workqueue("visornic_serverdown");
+       if (!visornic_serverdown_workqueue)
+               goto cleanup_debugfs;
+
+       /* create workqueue for tx timeout reset */
+       visornic_timeout_reset_workqueue =
+               create_singlethread_workqueue("visornic_timeout_reset");
+       if (!visornic_timeout_reset_workqueue)
+               goto cleanup_workqueue;
+
+       spin_lock_init(&dev_num_pool_lock);
+       dev_num_pool = kzalloc(BITS_TO_LONGS(MAXDEVICES), GFP_KERNEL);
+       if (!dev_num_pool)
+               goto cleanup_workqueue;
+
+       visorbus_register_visor_driver(&visornic_driver);
+       return 0;
+
+cleanup_workqueue:
+       flush_workqueue(visornic_serverdown_workqueue);
+       destroy_workqueue(visornic_serverdown_workqueue);
+       if (visornic_timeout_reset_workqueue) {
+               flush_workqueue(visornic_timeout_reset_workqueue);
+               destroy_workqueue(visornic_timeout_reset_workqueue);
+       }
+cleanup_debugfs:
+       debugfs_remove_recursive(visornic_debugfs_dir);
+
+       return err;
+}
+
+/**
+ *     visornic_cleanup        - driver exit routine
+ *
+ *     Unregister driver from the bus and free up memory.
+ */
+static void visornic_cleanup(void)
+{
+       if (visornic_serverdown_workqueue) {
+               flush_workqueue(visornic_serverdown_workqueue);
+               destroy_workqueue(visornic_serverdown_workqueue);
+       }
+       if (visornic_timeout_reset_workqueue) {
+               flush_workqueue(visornic_timeout_reset_workqueue);
+               destroy_workqueue(visornic_timeout_reset_workqueue);
+       }
+       debugfs_remove_recursive(visornic_debugfs_dir);
+
+       visorbus_unregister_visor_driver(&visornic_driver);
+       kfree(dev_num_pool);
+       dev_num_pool = NULL;
+}
+
+module_init(visornic_init);
+module_exit(visornic_cleanup);
+
+MODULE_AUTHOR("Unisys");
+MODULE_LICENSE("GPL");
+MODULE_DESCRIPTION("sPAR nic driver for sparlinux: ver 1.0.0.0");
+MODULE_VERSION("1.0.0.0");