Commit 74e53a3a authored by Florian Westphal's avatar Florian Westphal Committed by Greg Kroah-Hartman

dctcp: avoid bogus doubling of cwnd after loss

[ Upstream commit ce6dd233 ]

If a congestion control module doesn't provide .undo_cwnd function,
tcp_undo_cwnd_reduction() will set cwnd to

   tp->snd_cwnd = max(tp->snd_cwnd, tp->snd_ssthresh << 1);

... which makes sense for reno (it sets ssthresh to half the current cwnd),
but it makes no sense for dctcp, which sets ssthresh based on the current
congestion estimate.

This can cause severe growth of cwnd (eventually overflowing u32).

Fix this by saving last cwnd on loss and restore cwnd based on that,
similar to cubic and other algorithms.

Fixes: e3118e83 ("net: tcp: add DCTCP congestion control algorithm")
Cc: Lawrence Brakmo <brakmo@fb.com>
Cc: Andrew Shewmaker <agshew@gmail.com>
Cc: Glenn Judd <glenn.judd@morganstanley.com>
Acked-by: default avatarDaniel Borkmann <daniel@iogearbox.net>
Signed-off-by: default avatarFlorian Westphal <fw@strlen.de>
Signed-off-by: default avatarDavid S. Miller <davem@davemloft.net>
Signed-off-by: default avatarGreg Kroah-Hartman <gregkh@linuxfoundation.org>
parent 86429bd4
...@@ -56,6 +56,7 @@ struct dctcp { ...@@ -56,6 +56,7 @@ struct dctcp {
u32 next_seq; u32 next_seq;
u32 ce_state; u32 ce_state;
u32 delayed_ack_reserved; u32 delayed_ack_reserved;
u32 loss_cwnd;
}; };
static unsigned int dctcp_shift_g __read_mostly = 4; /* g = 1/2^4 */ static unsigned int dctcp_shift_g __read_mostly = 4; /* g = 1/2^4 */
...@@ -96,6 +97,7 @@ static void dctcp_init(struct sock *sk) ...@@ -96,6 +97,7 @@ static void dctcp_init(struct sock *sk)
ca->dctcp_alpha = min(dctcp_alpha_on_init, DCTCP_MAX_ALPHA); ca->dctcp_alpha = min(dctcp_alpha_on_init, DCTCP_MAX_ALPHA);
ca->delayed_ack_reserved = 0; ca->delayed_ack_reserved = 0;
ca->loss_cwnd = 0;
ca->ce_state = 0; ca->ce_state = 0;
dctcp_reset(tp, ca); dctcp_reset(tp, ca);
...@@ -111,9 +113,10 @@ static void dctcp_init(struct sock *sk) ...@@ -111,9 +113,10 @@ static void dctcp_init(struct sock *sk)
static u32 dctcp_ssthresh(struct sock *sk) static u32 dctcp_ssthresh(struct sock *sk)
{ {
const struct dctcp *ca = inet_csk_ca(sk); struct dctcp *ca = inet_csk_ca(sk);
struct tcp_sock *tp = tcp_sk(sk); struct tcp_sock *tp = tcp_sk(sk);
ca->loss_cwnd = tp->snd_cwnd;
return max(tp->snd_cwnd - ((tp->snd_cwnd * ca->dctcp_alpha) >> 11U), 2U); return max(tp->snd_cwnd - ((tp->snd_cwnd * ca->dctcp_alpha) >> 11U), 2U);
} }
...@@ -308,12 +311,20 @@ static size_t dctcp_get_info(struct sock *sk, u32 ext, int *attr, ...@@ -308,12 +311,20 @@ static size_t dctcp_get_info(struct sock *sk, u32 ext, int *attr,
return 0; return 0;
} }
static u32 dctcp_cwnd_undo(struct sock *sk)
{
const struct dctcp *ca = inet_csk_ca(sk);
return max(tcp_sk(sk)->snd_cwnd, ca->loss_cwnd);
}
static struct tcp_congestion_ops dctcp __read_mostly = { static struct tcp_congestion_ops dctcp __read_mostly = {
.init = dctcp_init, .init = dctcp_init,
.in_ack_event = dctcp_update_alpha, .in_ack_event = dctcp_update_alpha,
.cwnd_event = dctcp_cwnd_event, .cwnd_event = dctcp_cwnd_event,
.ssthresh = dctcp_ssthresh, .ssthresh = dctcp_ssthresh,
.cong_avoid = tcp_reno_cong_avoid, .cong_avoid = tcp_reno_cong_avoid,
.undo_cwnd = dctcp_cwnd_undo,
.set_state = dctcp_state, .set_state = dctcp_state,
.get_info = dctcp_get_info, .get_info = dctcp_get_info,
.flags = TCP_CONG_NEEDS_ECN, .flags = TCP_CONG_NEEDS_ECN,
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment