tcp: be more careful in tcp_fragment()

author Eric Dumazet <edumazet@google.com>
Tue, 6 Aug 2019 15:09:14 +0000 (17:09 +0200)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Fri, 9 Aug 2019 15:53:32 +0000 (17:53 +0200)

diff --git a/include/net/tcp.h b/include/net/tcp.h

index 0b477a1e11770baf1e850df022542444736cf670..7994e569644e0c017d08c66484545de2a14002f4 100644 (file)
--- a/include/net/tcp.h
+++ b/include/net/tcp.h
@@ -1688,6 +1688,23 @@ static inline void tcp_check_send_head(struct sock *sk, struct sk_buff *skb_unli
                 tcp_sk(sk)->highest_sack = NULL;
  }
  
+static inline struct sk_buff *tcp_rtx_queue_head(const struct sock *sk)
+{
+       struct sk_buff *skb = tcp_write_queue_head(sk);
+
+       if (skb == tcp_send_head(sk))
+               skb = NULL;
+
+       return skb;
+}
+
+static inline struct sk_buff *tcp_rtx_queue_tail(const struct sock *sk)
+{
+       struct sk_buff *skb = tcp_send_head(sk);
+
+       return skb ? tcp_write_queue_prev(sk, skb) : tcp_write_queue_tail(sk);
+}
+
  static inline void __tcp_add_write_queue_tail(struct sock *sk, struct sk_buff *skb)
  {
         __skb_queue_tail(&sk->sk_write_queue, skb);
diff --git a/net/ipv4/tcp_output.c b/net/ipv4/tcp_output.c

index a5960b9b6741cd0c43e4235a667a7a831f8d66bd..a99086bf26eaf2d83c6f7a0c497f36787f150308 100644 (file)
--- a/net/ipv4/tcp_output.c
+++ b/net/ipv4/tcp_output.c
@@ -1264,6 +1264,7 @@ int tcp_fragment(struct sock *sk, struct sk_buff *skb, u32 len,
         struct tcp_sock *tp = tcp_sk(sk);
         struct sk_buff *buff;
         int nsize, old_factor;
+       long limit;
         int nlen;
         u8 flags;
  
@@ -1274,7 +1275,15 @@ int tcp_fragment(struct sock *sk, struct sk_buff *skb, u32 len,
         if (nsize < 0)
                 nsize = 0;
  
-       if (unlikely((sk->sk_wmem_queued >> 1) > sk->sk_sndbuf + 0x20000)) {
+       /* tcp_sendmsg() can overshoot sk_wmem_queued by one full size skb.
+        * We need some allowance to not penalize applications setting small
+        * SO_SNDBUF values.
+        * Also allow first and last skb in retransmit queue to be split.
+        */
+       limit = sk->sk_sndbuf + 2 * SKB_TRUESIZE(GSO_MAX_SIZE);
+       if (unlikely((sk->sk_wmem_queued >> 1) > limit &&
+                    skb != tcp_rtx_queue_head(sk) &&
+                    skb != tcp_rtx_queue_tail(sk))) {
                 NET_INC_STATS(sock_net(sk), LINUX_MIB_TCPWQUEUETOOBIG);
                 return -ENOMEM;
         }
author	Eric Dumazet <edumazet@google.com>
	Tue, 6 Aug 2019 15:09:14 +0000 (17:09 +0200)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Fri, 9 Aug 2019 15:53:32 +0000 (17:53 +0200)
include/net/tcp.h		patch | blob | blame | history
net/ipv4/tcp_output.c		patch | blob | blame | history