Commit b081f85c authored by Eric Dumazet's avatar Eric Dumazet Committed by David S. Miller

net: implement tcp coalescing in tcp_queue_rcv()

Extend tcp coalescing implementing it from tcp_queue_rcv(), the main
receiver function when application is not blocked in recvmsg().

Function tcp_queue_rcv() is moved a bit to allow its call from
tcp_data_queue()

This gives good results especially if GRO could not kick, and if skb
head is a fragment.
Signed-off-by: default avatarEric Dumazet <edumazet@google.com>
Cc: Alexander Duyck <alexander.h.duyck@intel.com>
Cc: Neal Cardwell <ncardwell@google.com>
Cc: Tom Herbert <therbert@google.com>
Signed-off-by: default avatarDavid S. Miller <davem@davemloft.net>
parent 923dd347
...@@ -439,7 +439,8 @@ extern int tcp_disconnect(struct sock *sk, int flags); ...@@ -439,7 +439,8 @@ extern int tcp_disconnect(struct sock *sk, int flags);
void tcp_connect_init(struct sock *sk); void tcp_connect_init(struct sock *sk);
void tcp_finish_connect(struct sock *sk, struct sk_buff *skb); void tcp_finish_connect(struct sock *sk, struct sk_buff *skb);
void tcp_queue_rcv(struct sock *sk, struct sk_buff *skb, int hdrlen); int __must_check tcp_queue_rcv(struct sock *sk, struct sk_buff *skb,
int hdrlen, bool *fragstolen);
/* From syncookies.c */ /* From syncookies.c */
extern __u32 syncookie_secret[2][16-4+SHA_DIGEST_WORDS]; extern __u32 syncookie_secret[2][16-4+SHA_DIGEST_WORDS];
......
...@@ -981,8 +981,8 @@ static inline int select_size(const struct sock *sk, bool sg) ...@@ -981,8 +981,8 @@ static inline int select_size(const struct sock *sk, bool sg)
static int tcp_send_rcvq(struct sock *sk, struct msghdr *msg, size_t size) static int tcp_send_rcvq(struct sock *sk, struct msghdr *msg, size_t size)
{ {
struct sk_buff *skb; struct sk_buff *skb;
struct tcp_skb_cb *cb;
struct tcphdr *th; struct tcphdr *th;
bool fragstolen;
skb = alloc_skb(size + sizeof(*th), sk->sk_allocation); skb = alloc_skb(size + sizeof(*th), sk->sk_allocation);
if (!skb) if (!skb)
...@@ -995,14 +995,14 @@ static int tcp_send_rcvq(struct sock *sk, struct msghdr *msg, size_t size) ...@@ -995,14 +995,14 @@ static int tcp_send_rcvq(struct sock *sk, struct msghdr *msg, size_t size)
if (memcpy_fromiovec(skb_put(skb, size), msg->msg_iov, size)) if (memcpy_fromiovec(skb_put(skb, size), msg->msg_iov, size))
goto err_free; goto err_free;
cb = TCP_SKB_CB(skb);
TCP_SKB_CB(skb)->seq = tcp_sk(sk)->rcv_nxt; TCP_SKB_CB(skb)->seq = tcp_sk(sk)->rcv_nxt;
TCP_SKB_CB(skb)->end_seq = TCP_SKB_CB(skb)->seq + size; TCP_SKB_CB(skb)->end_seq = TCP_SKB_CB(skb)->seq + size;
TCP_SKB_CB(skb)->ack_seq = tcp_sk(sk)->snd_una - 1; TCP_SKB_CB(skb)->ack_seq = tcp_sk(sk)->snd_una - 1;
tcp_queue_rcv(sk, skb, sizeof(*th)); if (tcp_queue_rcv(sk, skb, sizeof(*th), &fragstolen)) {
WARN_ON_ONCE(fragstolen); /* should not happen */
__kfree_skb(skb);
}
return size; return size;
err_free: err_free:
......
...@@ -4739,6 +4739,22 @@ static void tcp_data_queue_ofo(struct sock *sk, struct sk_buff *skb) ...@@ -4739,6 +4739,22 @@ static void tcp_data_queue_ofo(struct sock *sk, struct sk_buff *skb)
skb_set_owner_r(skb, sk); skb_set_owner_r(skb, sk);
} }
int tcp_queue_rcv(struct sock *sk, struct sk_buff *skb, int hdrlen,
bool *fragstolen)
{
int eaten;
struct sk_buff *tail = skb_peek_tail(&sk->sk_receive_queue);
__skb_pull(skb, hdrlen);
eaten = (tail &&
tcp_try_coalesce(sk, tail, skb, fragstolen)) ? 1 : 0;
tcp_sk(sk)->rcv_nxt = TCP_SKB_CB(skb)->end_seq;
if (!eaten) {
__skb_queue_tail(&sk->sk_receive_queue, skb);
skb_set_owner_r(skb, sk);
}
return eaten;
}
static void tcp_data_queue(struct sock *sk, struct sk_buff *skb) static void tcp_data_queue(struct sock *sk, struct sk_buff *skb)
{ {
...@@ -4785,20 +4801,12 @@ static void tcp_data_queue(struct sock *sk, struct sk_buff *skb) ...@@ -4785,20 +4801,12 @@ static void tcp_data_queue(struct sock *sk, struct sk_buff *skb)
} }
if (eaten <= 0) { if (eaten <= 0) {
struct sk_buff *tail;
queue_and_out: queue_and_out:
if (eaten < 0 && if (eaten < 0 &&
tcp_try_rmem_schedule(sk, skb->truesize)) tcp_try_rmem_schedule(sk, skb->truesize))
goto drop; goto drop;
tail = skb_peek_tail(&sk->sk_receive_queue); eaten = tcp_queue_rcv(sk, skb, 0, &fragstolen);
eaten = (tail &&
tcp_try_coalesce(sk, tail, skb,
&fragstolen)) ? 1 : 0;
if (eaten <= 0) {
skb_set_owner_r(skb, sk);
__skb_queue_tail(&sk->sk_receive_queue, skb);
}
} }
tp->rcv_nxt = TCP_SKB_CB(skb)->end_seq; tp->rcv_nxt = TCP_SKB_CB(skb)->end_seq;
if (skb->len) if (skb->len)
...@@ -5493,14 +5501,6 @@ static int tcp_validate_incoming(struct sock *sk, struct sk_buff *skb, ...@@ -5493,14 +5501,6 @@ static int tcp_validate_incoming(struct sock *sk, struct sk_buff *skb,
return 0; return 0;
} }
void tcp_queue_rcv(struct sock *sk, struct sk_buff *skb, int hdrlen)
{
__skb_pull(skb, hdrlen);
__skb_queue_tail(&sk->sk_receive_queue, skb);
skb_set_owner_r(skb, sk);
tcp_sk(sk)->rcv_nxt = TCP_SKB_CB(skb)->end_seq;
}
/* /*
* TCP receive function for the ESTABLISHED state. * TCP receive function for the ESTABLISHED state.
* *
...@@ -5609,6 +5609,7 @@ int tcp_rcv_established(struct sock *sk, struct sk_buff *skb, ...@@ -5609,6 +5609,7 @@ int tcp_rcv_established(struct sock *sk, struct sk_buff *skb,
} else { } else {
int eaten = 0; int eaten = 0;
int copied_early = 0; int copied_early = 0;
bool fragstolen = false;
if (tp->copied_seq == tp->rcv_nxt && if (tp->copied_seq == tp->rcv_nxt &&
len - tcp_header_len <= tp->ucopy.len) { len - tcp_header_len <= tp->ucopy.len) {
...@@ -5666,7 +5667,8 @@ int tcp_rcv_established(struct sock *sk, struct sk_buff *skb, ...@@ -5666,7 +5667,8 @@ int tcp_rcv_established(struct sock *sk, struct sk_buff *skb,
NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPHPHITS); NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPHPHITS);
/* Bulk data transfer: receiver */ /* Bulk data transfer: receiver */
tcp_queue_rcv(sk, skb, tcp_header_len); eaten = tcp_queue_rcv(sk, skb, tcp_header_len,
&fragstolen);
} }
tcp_event_data_recv(sk, skb); tcp_event_data_recv(sk, skb);
...@@ -5688,7 +5690,7 @@ int tcp_rcv_established(struct sock *sk, struct sk_buff *skb, ...@@ -5688,7 +5690,7 @@ int tcp_rcv_established(struct sock *sk, struct sk_buff *skb,
else else
#endif #endif
if (eaten) if (eaten)
__kfree_skb(skb); kfree_skb_partial(skb, fragstolen);
else else
sk->sk_data_ready(sk, 0); sk->sk_data_ready(sk, 0);
return 0; return 0;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment