vxge: prefetch RxD descriptors
author Benjamin LaHaise <ben.lahaise@neterion.com>
Tue, 4 Aug 2009 10:21:39 +0000 (10:21 +0000)
committer David S. Miller <davem@davemloft.net>
Wed, 5 Aug 2009 20:10:45 +0000 (13:10 -0700)
This patch prefetches RxD descriptors, which helps to hide the latency of a
cache miss in vxge_hw_ring_rxd_next_completed(), where the descriptor is
accessed.  When profiling netperf on a P4 Xeon, this lowers the share of CPU
time spent in vxge_hw_ring_rxd_next_completed() from 1.5% to 1.0%.

Signed-off-by: Benjamin LaHaise <ben.lahaise@neterion.com>
Signed-off-by: Sreenivasa Honnur <sreenivasa.honnur@neterion.com>
Signed-off-by: Ramkrishna Vepa <ram.vepa@neterion.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
drivers/net/vxge/vxge-main.c
drivers/net/vxge/vxge-traffic.c

index 4b22513bed402ec195000eb206b94d76d56ad2c5..e93651c19f59ab0dde9f2860781bd19652f94c02 100644 (file)
@@ -445,6 +445,7 @@ vxge_rx_1b_compl(struct __vxge_hw_ring *ringh, void *dtr,
        vxge_hw_ring_replenish(ringh, 0);
 
        do {
+               prefetch((char *)dtr + L1_CACHE_BYTES);
                rx_priv = vxge_hw_ring_rxd_private_get(dtr);
                skb = rx_priv->skb;
                data_size = rx_priv->data_size;
index 0efb769894ef42b01a667b589e7182b3f09a65f8..fe3ae518c69c30b24eeb7e12ec61dfaa08983ebb 100644 (file)
@@ -731,6 +731,7 @@ vxge_hw_channel_dtr_try_complete(struct __vxge_hw_channel *channel, void **dtrh)
        vxge_assert(channel->compl_index < channel->length);
 
        *dtrh = channel->work_arr[channel->compl_index];
+       prefetch(*dtrh);
 }
 
 /*