net: optimise inet_proto_csum_replace4()
author: LEROY Christophe <christophe.leroy@c-s.fr>
Tue, 23 Sep 2014 08:54:37 +0000 (10:54 +0200)
committer: David S. Miller <davem@davemloft.net>
Fri, 26 Sep 2014 20:14:17 +0000 (16:14 -0400)
csum_partial() is a generic function which is not optimised for small
fixed-length calculations, and its use requires storing the "from" and "to"
values in memory while we already have them available in registers. This also
has an impact,
especially on RISC processors. In the same spirit as the change done by
Eric Dumazet on csum_replace2(), this patch rewrites inet_proto_csum_replace4()
taking into account RFC1624.

During a NATted TCP transfer, I spotted that csum_partial() is one of the top 5
consuming functions (around 8%), and the second biggest user of csum_partial()
is inet_proto_csum_replace4().

Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Acked-by: Eric Dumazet <edumazet@google.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
net/core/utils.c

index eed34338736c275aa02bfa40448801d46dda736b..efc76dd9dcd160aaf31a37454fc980fbb7e9d5b4 100644 (file)
@@ -306,16 +306,14 @@ EXPORT_SYMBOL(in6_pton);
 void inet_proto_csum_replace4(__sum16 *sum, struct sk_buff *skb,
                              __be32 from, __be32 to, int pseudohdr)
 {
-       __be32 diff[] = { ~from, to };
        if (skb->ip_summed != CHECKSUM_PARTIAL) {
-               *sum = csum_fold(csum_partial(diff, sizeof(diff),
-                               ~csum_unfold(*sum)));
+               *sum = csum_fold(csum_add(csum_sub(~csum_unfold(*sum), from),
+                                to));
                if (skb->ip_summed == CHECKSUM_COMPLETE && pseudohdr)
-                       skb->csum = ~csum_partial(diff, sizeof(diff),
-                                               ~skb->csum);
+                       skb->csum = ~csum_add(csum_sub(~(skb->csum), from), to);
        } else if (pseudohdr)
-               *sum = ~csum_fold(csum_partial(diff, sizeof(diff),
-                               csum_unfold(*sum)));
+               *sum = ~csum_fold(csum_add(csum_sub(csum_unfold(*sum), from),
+                                 to));
 }
 EXPORT_SYMBOL(inet_proto_csum_replace4);