udp: add batching to udp_rmem_release()
authorEric Dumazet <edumazet@google.com>
Thu, 8 Dec 2016 19:41:56 +0000 (11:41 -0800)
committerDavid S. Miller <davem@davemloft.net>
Sat, 10 Dec 2016 03:12:21 +0000 (22:12 -0500)
If udp_recvmsg() constantly releases sk_rmem_alloc
for every read packet, it gives producers the opportunity
to immediately grab spinlocks and desperately
try adding another packet, causing false sharing.

We can add a simple heuristic to give the signal
by batches of ~25 % of the queue capacity.

This patch considerably increases performance under
flood by about 50 %, since the thread draining the queue
is no longer slowed by false sharing.

Signed-off-by: Eric Dumazet <edumazet@google.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
include/linux/udp.h
net/ipv4/udp.c

index d1fd8cd39478b635ef5396b5ae1c63f8c9658817..c0f530809d1f3db7323e51a52224eb49d8f97da0 100644 (file)
@@ -79,6 +79,9 @@ struct udp_sock {
        int                     (*gro_complete)(struct sock *sk,
                                                struct sk_buff *skb,
                                                int nhoff);
+
+       /* This field is dirtied by udp_recvmsg() */
+       int             forward_deficit;
 };
 
 static inline struct udp_sock *udp_sk(const struct sock *sk)
index c608334d99aa5620858d9cceec500b2be944e595..5a38faa12cde7fdcd5b6d86cdc0f4bc33de427bb 100644 (file)
@@ -1177,8 +1177,20 @@ out:
 /* fully reclaim rmem/fwd memory allocated for skb */
 static void udp_rmem_release(struct sock *sk, int size, int partial)
 {
+       struct udp_sock *up = udp_sk(sk);
        int amt;
 
+       if (likely(partial)) {
+               up->forward_deficit += size;
+               size = up->forward_deficit;
+               if (size < (sk->sk_rcvbuf >> 2) &&
+                   !skb_queue_empty(&sk->sk_receive_queue))
+                       return;
+       } else {
+               size += up->forward_deficit;
+       }
+       up->forward_deficit = 0;
+
        atomic_sub(size, &sk->sk_rmem_alloc);
        sk->sk_forward_alloc += size;
        amt = (sk->sk_forward_alloc - partial) & ~(SK_MEM_QUANTUM - 1);