Commit 9e36ced6 authored by David S. Miller's avatar David S. Miller

Merge branch 'tcp-cong-undo_cwnd-mandatory'

Florian Westphal says:

====================
tcp: make undo_cwnd mandatory for congestion modules

highspeed, illinois, scalable, veno and yeah congestion control algorithms
don't provide a 'cwnd_undo' function.  This makes the stack default to a
'reno undo' which doubles cwnd.  However, the ssthresh implementation of
these algorithms do not halve the slowstart threshold. This causes similar
issue as the one fixed for dctcp in ce6dd233 ("dctcp: avoid bogus
doubling of cwnd after loss").

In light of this it seems better to remove the fallback and make undo_cwnd
mandatory.

First patch fixes those spots where reno undo seems incorrect by providing
.cwnd_undo functions, second patch removes the fallback.
====================
Signed-off-by: default avatarDavid S. Miller <davem@davemloft.net>
parents 2fcb58ab e9799183
...@@ -958,6 +958,7 @@ u32 tcp_slow_start(struct tcp_sock *tp, u32 acked); ...@@ -958,6 +958,7 @@ u32 tcp_slow_start(struct tcp_sock *tp, u32 acked);
void tcp_cong_avoid_ai(struct tcp_sock *tp, u32 w, u32 acked); void tcp_cong_avoid_ai(struct tcp_sock *tp, u32 w, u32 acked);
u32 tcp_reno_ssthresh(struct sock *sk); u32 tcp_reno_ssthresh(struct sock *sk);
u32 tcp_reno_undo_cwnd(struct sock *sk);
void tcp_reno_cong_avoid(struct sock *sk, u32 ack, u32 acked); void tcp_reno_cong_avoid(struct sock *sk, u32 ack, u32 acked);
extern struct tcp_congestion_ops tcp_reno; extern struct tcp_congestion_ops tcp_reno;
......
...@@ -68,8 +68,9 @@ int tcp_register_congestion_control(struct tcp_congestion_ops *ca) ...@@ -68,8 +68,9 @@ int tcp_register_congestion_control(struct tcp_congestion_ops *ca)
{ {
int ret = 0; int ret = 0;
/* all algorithms must implement ssthresh and cong_avoid ops */ /* all algorithms must implement these */
if (!ca->ssthresh || !(ca->cong_avoid || ca->cong_control)) { if (!ca->ssthresh || !ca->undo_cwnd ||
!(ca->cong_avoid || ca->cong_control)) {
pr_err("%s does not implement required ops\n", ca->name); pr_err("%s does not implement required ops\n", ca->name);
return -EINVAL; return -EINVAL;
} }
...@@ -441,10 +442,19 @@ u32 tcp_reno_ssthresh(struct sock *sk) ...@@ -441,10 +442,19 @@ u32 tcp_reno_ssthresh(struct sock *sk)
} }
EXPORT_SYMBOL_GPL(tcp_reno_ssthresh); EXPORT_SYMBOL_GPL(tcp_reno_ssthresh);
u32 tcp_reno_undo_cwnd(struct sock *sk)
{
const struct tcp_sock *tp = tcp_sk(sk);
return max(tp->snd_cwnd, tp->snd_ssthresh << 1);
}
EXPORT_SYMBOL_GPL(tcp_reno_undo_cwnd);
struct tcp_congestion_ops tcp_reno = { struct tcp_congestion_ops tcp_reno = {
.flags = TCP_CONG_NON_RESTRICTED, .flags = TCP_CONG_NON_RESTRICTED,
.name = "reno", .name = "reno",
.owner = THIS_MODULE, .owner = THIS_MODULE,
.ssthresh = tcp_reno_ssthresh, .ssthresh = tcp_reno_ssthresh,
.cong_avoid = tcp_reno_cong_avoid, .cong_avoid = tcp_reno_cong_avoid,
.undo_cwnd = tcp_reno_undo_cwnd,
}; };
...@@ -342,6 +342,7 @@ static struct tcp_congestion_ops dctcp __read_mostly = { ...@@ -342,6 +342,7 @@ static struct tcp_congestion_ops dctcp __read_mostly = {
static struct tcp_congestion_ops dctcp_reno __read_mostly = { static struct tcp_congestion_ops dctcp_reno __read_mostly = {
.ssthresh = tcp_reno_ssthresh, .ssthresh = tcp_reno_ssthresh,
.cong_avoid = tcp_reno_cong_avoid, .cong_avoid = tcp_reno_cong_avoid,
.undo_cwnd = tcp_reno_undo_cwnd,
.get_info = dctcp_get_info, .get_info = dctcp_get_info,
.owner = THIS_MODULE, .owner = THIS_MODULE,
.name = "dctcp-reno", .name = "dctcp-reno",
......
...@@ -94,6 +94,7 @@ static const struct hstcp_aimd_val { ...@@ -94,6 +94,7 @@ static const struct hstcp_aimd_val {
struct hstcp { struct hstcp {
u32 ai; u32 ai;
u32 loss_cwnd;
}; };
static void hstcp_init(struct sock *sk) static void hstcp_init(struct sock *sk)
...@@ -150,16 +151,24 @@ static void hstcp_cong_avoid(struct sock *sk, u32 ack, u32 acked) ...@@ -150,16 +151,24 @@ static void hstcp_cong_avoid(struct sock *sk, u32 ack, u32 acked)
static u32 hstcp_ssthresh(struct sock *sk) static u32 hstcp_ssthresh(struct sock *sk)
{ {
const struct tcp_sock *tp = tcp_sk(sk); const struct tcp_sock *tp = tcp_sk(sk);
const struct hstcp *ca = inet_csk_ca(sk); struct hstcp *ca = inet_csk_ca(sk);
ca->loss_cwnd = tp->snd_cwnd;
/* Do multiplicative decrease */ /* Do multiplicative decrease */
return max(tp->snd_cwnd - ((tp->snd_cwnd * hstcp_aimd_vals[ca->ai].md) >> 8), 2U); return max(tp->snd_cwnd - ((tp->snd_cwnd * hstcp_aimd_vals[ca->ai].md) >> 8), 2U);
} }
static u32 hstcp_cwnd_undo(struct sock *sk)
{
const struct hstcp *ca = inet_csk_ca(sk);
return max(tcp_sk(sk)->snd_cwnd, ca->loss_cwnd);
}
static struct tcp_congestion_ops tcp_highspeed __read_mostly = { static struct tcp_congestion_ops tcp_highspeed __read_mostly = {
.init = hstcp_init, .init = hstcp_init,
.ssthresh = hstcp_ssthresh, .ssthresh = hstcp_ssthresh,
.undo_cwnd = hstcp_cwnd_undo,
.cong_avoid = hstcp_cong_avoid, .cong_avoid = hstcp_cong_avoid,
.owner = THIS_MODULE, .owner = THIS_MODULE,
......
...@@ -166,6 +166,7 @@ static void hybla_cong_avoid(struct sock *sk, u32 ack, u32 acked) ...@@ -166,6 +166,7 @@ static void hybla_cong_avoid(struct sock *sk, u32 ack, u32 acked)
static struct tcp_congestion_ops tcp_hybla __read_mostly = { static struct tcp_congestion_ops tcp_hybla __read_mostly = {
.init = hybla_init, .init = hybla_init,
.ssthresh = tcp_reno_ssthresh, .ssthresh = tcp_reno_ssthresh,
.undo_cwnd = tcp_reno_undo_cwnd,
.cong_avoid = hybla_cong_avoid, .cong_avoid = hybla_cong_avoid,
.set_state = hybla_state, .set_state = hybla_state,
......
...@@ -48,6 +48,7 @@ struct illinois { ...@@ -48,6 +48,7 @@ struct illinois {
u32 end_seq; /* right edge of current RTT */ u32 end_seq; /* right edge of current RTT */
u32 alpha; /* Additive increase */ u32 alpha; /* Additive increase */
u32 beta; /* Muliplicative decrease */ u32 beta; /* Muliplicative decrease */
u32 loss_cwnd; /* cwnd on loss */
u16 acked; /* # packets acked by current ACK */ u16 acked; /* # packets acked by current ACK */
u8 rtt_above; /* average rtt has gone above threshold */ u8 rtt_above; /* average rtt has gone above threshold */
u8 rtt_low; /* # of rtts measurements below threshold */ u8 rtt_low; /* # of rtts measurements below threshold */
...@@ -296,10 +297,18 @@ static u32 tcp_illinois_ssthresh(struct sock *sk) ...@@ -296,10 +297,18 @@ static u32 tcp_illinois_ssthresh(struct sock *sk)
struct tcp_sock *tp = tcp_sk(sk); struct tcp_sock *tp = tcp_sk(sk);
struct illinois *ca = inet_csk_ca(sk); struct illinois *ca = inet_csk_ca(sk);
ca->loss_cwnd = tp->snd_cwnd;
/* Multiplicative decrease */ /* Multiplicative decrease */
return max(tp->snd_cwnd - ((tp->snd_cwnd * ca->beta) >> BETA_SHIFT), 2U); return max(tp->snd_cwnd - ((tp->snd_cwnd * ca->beta) >> BETA_SHIFT), 2U);
} }
static u32 tcp_illinois_cwnd_undo(struct sock *sk)
{
const struct illinois *ca = inet_csk_ca(sk);
return max(tcp_sk(sk)->snd_cwnd, ca->loss_cwnd);
}
/* Extract info for Tcp socket info provided via netlink. */ /* Extract info for Tcp socket info provided via netlink. */
static size_t tcp_illinois_info(struct sock *sk, u32 ext, int *attr, static size_t tcp_illinois_info(struct sock *sk, u32 ext, int *attr,
union tcp_cc_info *info) union tcp_cc_info *info)
...@@ -327,6 +336,7 @@ static size_t tcp_illinois_info(struct sock *sk, u32 ext, int *attr, ...@@ -327,6 +336,7 @@ static size_t tcp_illinois_info(struct sock *sk, u32 ext, int *attr,
static struct tcp_congestion_ops tcp_illinois __read_mostly = { static struct tcp_congestion_ops tcp_illinois __read_mostly = {
.init = tcp_illinois_init, .init = tcp_illinois_init,
.ssthresh = tcp_illinois_ssthresh, .ssthresh = tcp_illinois_ssthresh,
.undo_cwnd = tcp_illinois_cwnd_undo,
.cong_avoid = tcp_illinois_cong_avoid, .cong_avoid = tcp_illinois_cong_avoid,
.set_state = tcp_illinois_state, .set_state = tcp_illinois_state,
.get_info = tcp_illinois_info, .get_info = tcp_illinois_info,
......
...@@ -2394,10 +2394,7 @@ static void tcp_undo_cwnd_reduction(struct sock *sk, bool unmark_loss) ...@@ -2394,10 +2394,7 @@ static void tcp_undo_cwnd_reduction(struct sock *sk, bool unmark_loss)
if (tp->prior_ssthresh) { if (tp->prior_ssthresh) {
const struct inet_connection_sock *icsk = inet_csk(sk); const struct inet_connection_sock *icsk = inet_csk(sk);
if (icsk->icsk_ca_ops->undo_cwnd)
tp->snd_cwnd = icsk->icsk_ca_ops->undo_cwnd(sk); tp->snd_cwnd = icsk->icsk_ca_ops->undo_cwnd(sk);
else
tp->snd_cwnd = max(tp->snd_cwnd, tp->snd_ssthresh << 1);
if (tp->prior_ssthresh > tp->snd_ssthresh) { if (tp->prior_ssthresh > tp->snd_ssthresh) {
tp->snd_ssthresh = tp->prior_ssthresh; tp->snd_ssthresh = tp->prior_ssthresh;
......
...@@ -316,6 +316,7 @@ static void tcp_lp_pkts_acked(struct sock *sk, const struct ack_sample *sample) ...@@ -316,6 +316,7 @@ static void tcp_lp_pkts_acked(struct sock *sk, const struct ack_sample *sample)
static struct tcp_congestion_ops tcp_lp __read_mostly = { static struct tcp_congestion_ops tcp_lp __read_mostly = {
.init = tcp_lp_init, .init = tcp_lp_init,
.ssthresh = tcp_reno_ssthresh, .ssthresh = tcp_reno_ssthresh,
.undo_cwnd = tcp_reno_undo_cwnd,
.cong_avoid = tcp_lp_cong_avoid, .cong_avoid = tcp_lp_cong_avoid,
.pkts_acked = tcp_lp_pkts_acked, .pkts_acked = tcp_lp_pkts_acked,
......
...@@ -15,6 +15,10 @@ ...@@ -15,6 +15,10 @@
#define TCP_SCALABLE_AI_CNT 50U #define TCP_SCALABLE_AI_CNT 50U
#define TCP_SCALABLE_MD_SCALE 3 #define TCP_SCALABLE_MD_SCALE 3
struct scalable {
u32 loss_cwnd;
};
static void tcp_scalable_cong_avoid(struct sock *sk, u32 ack, u32 acked) static void tcp_scalable_cong_avoid(struct sock *sk, u32 ack, u32 acked)
{ {
struct tcp_sock *tp = tcp_sk(sk); struct tcp_sock *tp = tcp_sk(sk);
...@@ -32,12 +36,23 @@ static void tcp_scalable_cong_avoid(struct sock *sk, u32 ack, u32 acked) ...@@ -32,12 +36,23 @@ static void tcp_scalable_cong_avoid(struct sock *sk, u32 ack, u32 acked)
static u32 tcp_scalable_ssthresh(struct sock *sk) static u32 tcp_scalable_ssthresh(struct sock *sk)
{ {
const struct tcp_sock *tp = tcp_sk(sk); const struct tcp_sock *tp = tcp_sk(sk);
struct scalable *ca = inet_csk_ca(sk);
ca->loss_cwnd = tp->snd_cwnd;
return max(tp->snd_cwnd - (tp->snd_cwnd>>TCP_SCALABLE_MD_SCALE), 2U); return max(tp->snd_cwnd - (tp->snd_cwnd>>TCP_SCALABLE_MD_SCALE), 2U);
} }
static u32 tcp_scalable_cwnd_undo(struct sock *sk)
{
const struct scalable *ca = inet_csk_ca(sk);
return max(tcp_sk(sk)->snd_cwnd, ca->loss_cwnd);
}
static struct tcp_congestion_ops tcp_scalable __read_mostly = { static struct tcp_congestion_ops tcp_scalable __read_mostly = {
.ssthresh = tcp_scalable_ssthresh, .ssthresh = tcp_scalable_ssthresh,
.undo_cwnd = tcp_scalable_cwnd_undo,
.cong_avoid = tcp_scalable_cong_avoid, .cong_avoid = tcp_scalable_cong_avoid,
.owner = THIS_MODULE, .owner = THIS_MODULE,
......
...@@ -307,6 +307,7 @@ EXPORT_SYMBOL_GPL(tcp_vegas_get_info); ...@@ -307,6 +307,7 @@ EXPORT_SYMBOL_GPL(tcp_vegas_get_info);
static struct tcp_congestion_ops tcp_vegas __read_mostly = { static struct tcp_congestion_ops tcp_vegas __read_mostly = {
.init = tcp_vegas_init, .init = tcp_vegas_init,
.ssthresh = tcp_reno_ssthresh, .ssthresh = tcp_reno_ssthresh,
.undo_cwnd = tcp_reno_undo_cwnd,
.cong_avoid = tcp_vegas_cong_avoid, .cong_avoid = tcp_vegas_cong_avoid,
.pkts_acked = tcp_vegas_pkts_acked, .pkts_acked = tcp_vegas_pkts_acked,
.set_state = tcp_vegas_state, .set_state = tcp_vegas_state,
......
...@@ -30,6 +30,7 @@ struct veno { ...@@ -30,6 +30,7 @@ struct veno {
u32 basertt; /* the min of all Veno rtt measurements seen (in usec) */ u32 basertt; /* the min of all Veno rtt measurements seen (in usec) */
u32 inc; /* decide whether to increase cwnd */ u32 inc; /* decide whether to increase cwnd */
u32 diff; /* calculate the diff rate */ u32 diff; /* calculate the diff rate */
u32 loss_cwnd; /* cwnd when loss occured */
}; };
/* There are several situations when we must "re-start" Veno: /* There are several situations when we must "re-start" Veno:
...@@ -193,6 +194,7 @@ static u32 tcp_veno_ssthresh(struct sock *sk) ...@@ -193,6 +194,7 @@ static u32 tcp_veno_ssthresh(struct sock *sk)
const struct tcp_sock *tp = tcp_sk(sk); const struct tcp_sock *tp = tcp_sk(sk);
struct veno *veno = inet_csk_ca(sk); struct veno *veno = inet_csk_ca(sk);
veno->loss_cwnd = tp->snd_cwnd;
if (veno->diff < beta) if (veno->diff < beta)
/* in "non-congestive state", cut cwnd by 1/5 */ /* in "non-congestive state", cut cwnd by 1/5 */
return max(tp->snd_cwnd * 4 / 5, 2U); return max(tp->snd_cwnd * 4 / 5, 2U);
...@@ -201,9 +203,17 @@ static u32 tcp_veno_ssthresh(struct sock *sk) ...@@ -201,9 +203,17 @@ static u32 tcp_veno_ssthresh(struct sock *sk)
return max(tp->snd_cwnd >> 1U, 2U); return max(tp->snd_cwnd >> 1U, 2U);
} }
static u32 tcp_veno_cwnd_undo(struct sock *sk)
{
const struct veno *veno = inet_csk_ca(sk);
return max(tcp_sk(sk)->snd_cwnd, veno->loss_cwnd);
}
static struct tcp_congestion_ops tcp_veno __read_mostly = { static struct tcp_congestion_ops tcp_veno __read_mostly = {
.init = tcp_veno_init, .init = tcp_veno_init,
.ssthresh = tcp_veno_ssthresh, .ssthresh = tcp_veno_ssthresh,
.undo_cwnd = tcp_veno_cwnd_undo,
.cong_avoid = tcp_veno_cong_avoid, .cong_avoid = tcp_veno_cong_avoid,
.pkts_acked = tcp_veno_pkts_acked, .pkts_acked = tcp_veno_pkts_acked,
.set_state = tcp_veno_state, .set_state = tcp_veno_state,
......
...@@ -278,6 +278,7 @@ static struct tcp_congestion_ops tcp_westwood __read_mostly = { ...@@ -278,6 +278,7 @@ static struct tcp_congestion_ops tcp_westwood __read_mostly = {
.init = tcp_westwood_init, .init = tcp_westwood_init,
.ssthresh = tcp_reno_ssthresh, .ssthresh = tcp_reno_ssthresh,
.cong_avoid = tcp_reno_cong_avoid, .cong_avoid = tcp_reno_cong_avoid,
.undo_cwnd = tcp_reno_undo_cwnd,
.cwnd_event = tcp_westwood_event, .cwnd_event = tcp_westwood_event,
.in_ack_event = tcp_westwood_ack, .in_ack_event = tcp_westwood_ack,
.get_info = tcp_westwood_info, .get_info = tcp_westwood_info,
......
...@@ -37,6 +37,7 @@ struct yeah { ...@@ -37,6 +37,7 @@ struct yeah {
u32 fast_count; u32 fast_count;
u32 pkts_acked; u32 pkts_acked;
u32 loss_cwnd;
}; };
static void tcp_yeah_init(struct sock *sk) static void tcp_yeah_init(struct sock *sk)
...@@ -219,13 +220,22 @@ static u32 tcp_yeah_ssthresh(struct sock *sk) ...@@ -219,13 +220,22 @@ static u32 tcp_yeah_ssthresh(struct sock *sk)
yeah->fast_count = 0; yeah->fast_count = 0;
yeah->reno_count = max(yeah->reno_count>>1, 2U); yeah->reno_count = max(yeah->reno_count>>1, 2U);
yeah->loss_cwnd = tp->snd_cwnd;
return max_t(int, tp->snd_cwnd - reduction, 2); return max_t(int, tp->snd_cwnd - reduction, 2);
} }
static u32 tcp_yeah_cwnd_undo(struct sock *sk)
{
const struct yeah *yeah = inet_csk_ca(sk);
return max(tcp_sk(sk)->snd_cwnd, yeah->loss_cwnd);
}
static struct tcp_congestion_ops tcp_yeah __read_mostly = { static struct tcp_congestion_ops tcp_yeah __read_mostly = {
.init = tcp_yeah_init, .init = tcp_yeah_init,
.ssthresh = tcp_yeah_ssthresh, .ssthresh = tcp_yeah_ssthresh,
.undo_cwnd = tcp_yeah_cwnd_undo,
.cong_avoid = tcp_yeah_cong_avoid, .cong_avoid = tcp_yeah_cong_avoid,
.set_state = tcp_vegas_state, .set_state = tcp_vegas_state,
.cwnd_event = tcp_vegas_cwnd_event, .cwnd_event = tcp_vegas_cwnd_event,
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment