Skip to content

Commit 8c72c65

Browse files
Eric Dumazet authored and davem330 committed
tcp: update skb->skb_mstamp more carefully
liujian reported a problem in TCP_USER_TIMEOUT processing with a patch
in tcp_probe_timer() :
      https://www.spinics.net/lists/netdev/msg454496.html

After investigations, the root cause of the problem is that we update
skb->skb_mstamp of skbs in write queue, even if the attempt to send a
clone or copy of it failed. One reason being a routing problem.

This patch prevents this, solving liujian issue.

It also removes a potential RTT miscalculation, since
__tcp_retransmit_skb() is not OR-ing TCP_SKB_CB(skb)->sacked with
TCPCB_EVER_RETRANS if a failure happens, but skb->skb_mstamp has
been changed.

A future ACK would then lead to a very small RTT sample and min_rtt
would then be lowered to this too small value.

Tested:

# cat user_timeout.pkt
--local_ip=192.168.102.64

    0 socket(..., SOCK_STREAM, IPPROTO_TCP) = 3
   +0 setsockopt(3, SOL_SOCKET, SO_REUSEADDR, [1], 4) = 0
   +0 bind(3, ..., ...) = 0
   +0 listen(3, 1) = 0

   +0 `ifconfig tun0 192.168.102.64/16; ip ro add 192.0.2.1 dev tun0`

   +0 < S 0:0(0) win 0 <mss 1460>
   +0 > S. 0:0(0) ack 1 <mss 1460>

  +.1 < . 1:1(0) ack 1 win 65530
   +0 accept(3, ..., ...) = 4

   +0 setsockopt(4, SOL_TCP, TCP_USER_TIMEOUT, [3000], 4) = 0
   +0 write(4, ..., 24) = 24
   +0 > P. 1:25(24) ack 1 win 29200
  +.1 < . 1:1(0) ack 25 win 65530

//change the ipaddress
   +1 `ifconfig tun0 192.168.0.10/16`

   +1 write(4, ..., 24) = 24
   +1 write(4, ..., 24) = 24
   +1 write(4, ..., 24) = 24
   +1 write(4, ..., 24) = 24

   +0 `ifconfig tun0 192.168.102.64/16`
   +0 < . 1:2(1) ack 25 win 65530
   +0 `ifconfig tun0 192.168.0.10/16`

   +3 write(4, ..., 24) = -1

# ./packetdrill user_timeout.pkt

Signed-off-by: Eric Dumazet <[email protected]>
Reported-by: liujian <[email protected]>
Acked-by: Neal Cardwell <[email protected]>
Acked-by: Yuchung Cheng <[email protected]>
Acked-by: Soheil Hassas Yeganeh <[email protected]>
Signed-off-by: David S. Miller <[email protected]>
1 parent cbea8f0 commit 8c72c65

File tree

1 file changed

+12
-7
lines changed

1 file changed

+12
-7
lines changed

net/ipv4/tcp_output.c

Lines changed: 12 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -991,26 +991,28 @@ static int tcp_transmit_skb(struct sock *sk, struct sk_buff *skb, int clone_it,
991991
struct tcp_skb_cb *tcb;
992992
struct tcp_out_options opts;
993993
unsigned int tcp_options_size, tcp_header_size;
994+
struct sk_buff *oskb = NULL;
994995
struct tcp_md5sig_key *md5;
995996
struct tcphdr *th;
996997
int err;
997998

998999
BUG_ON(!skb || !tcp_skb_pcount(skb));
9991000
tp = tcp_sk(sk);
10001001

1001-
skb->skb_mstamp = tp->tcp_mstamp;
10021002
if (clone_it) {
10031003
TCP_SKB_CB(skb)->tx.in_flight = TCP_SKB_CB(skb)->end_seq
10041004
- tp->snd_una;
10051005
tcp_rate_skb_sent(sk, skb);
10061006

1007+
oskb = skb;
10071008
if (unlikely(skb_cloned(skb)))
10081009
skb = pskb_copy(skb, gfp_mask);
10091010
else
10101011
skb = skb_clone(skb, gfp_mask);
10111012
if (unlikely(!skb))
10121013
return -ENOBUFS;
10131014
}
1015+
skb->skb_mstamp = tp->tcp_mstamp;
10141016

10151017
inet = inet_sk(sk);
10161018
tcb = TCP_SKB_CB(skb);
@@ -1122,12 +1124,14 @@ static int tcp_transmit_skb(struct sock *sk, struct sk_buff *skb, int clone_it,
11221124

11231125
err = icsk->icsk_af_ops->queue_xmit(sk, skb, &inet->cork.fl);
11241126

1125-
if (likely(err <= 0))
1126-
return err;
1127-
1128-
tcp_enter_cwr(sk);
1127+
if (unlikely(err > 0)) {
1128+
tcp_enter_cwr(sk);
1129+
err = net_xmit_eval(err);
1130+
}
1131+
if (!err && oskb)
1132+
oskb->skb_mstamp = tp->tcp_mstamp;
11291133

1130-
return net_xmit_eval(err);
1134+
return err;
11311135
}
11321136

11331137
/* This routine just queues the buffer for sending.
@@ -2869,10 +2873,11 @@ int __tcp_retransmit_skb(struct sock *sk, struct sk_buff *skb, int segs)
28692873
skb_headroom(skb) >= 0xFFFF)) {
28702874
struct sk_buff *nskb;
28712875

2872-
skb->skb_mstamp = tp->tcp_mstamp;
28732876
nskb = __pskb_copy(skb, MAX_TCP_HEADER, GFP_ATOMIC);
28742877
err = nskb ? tcp_transmit_skb(sk, nskb, 0, GFP_ATOMIC) :
28752878
-ENOBUFS;
2879+
if (!err)
2880+
skb->skb_mstamp = tp->tcp_mstamp;
28762881
} else {
28772882
err = tcp_transmit_skb(sk, skb, 1, GFP_ATOMIC);
28782883
}

0 commit comments

Comments
 (0)