Commit f3fafbcb authored by David S. Miller

Merge branch 'L4S-style-ce_threshold_ect1-marking'

Eric Dumazet says:

====================
net/sched: implement L4S style ce_threshold_ect1 marking

As suggested by Ingemar Johansson, Neal Cardwell, and others, fq_codel can be used
for Low Latency, Low Loss, Scalable Throughput (L4S) with a small change.

In ce_threshold_ect1 mode, only ECT(1) packets can be marked to CE if
their sojourn time is above the threshold.
====================
Signed-off-by: David S. Miller <davem@davemloft.net>
parents 19757ceb e72aeb9e
...@@ -102,6 +102,7 @@ static inline u32 codel_time_to_us(codel_time_t val) ...@@ -102,6 +102,7 @@ static inline u32 codel_time_to_us(codel_time_t val)
* @interval: width of moving time window * @interval: width of moving time window
* @mtu: device mtu, or minimal queue backlog in bytes. * @mtu: device mtu, or minimal queue backlog in bytes.
* @ecn: is Explicit Congestion Notification enabled * @ecn: is Explicit Congestion Notification enabled
* @ce_threshold_ect1: if ce_threshold only marks ECT(1) packets
*/ */
struct codel_params { struct codel_params {
codel_time_t target; codel_time_t target;
...@@ -109,6 +110,7 @@ struct codel_params { ...@@ -109,6 +110,7 @@ struct codel_params {
codel_time_t interval; codel_time_t interval;
u32 mtu; u32 mtu;
bool ecn; bool ecn;
bool ce_threshold_ect1;
}; };
/** /**
......
...@@ -54,6 +54,7 @@ static void codel_params_init(struct codel_params *params) ...@@ -54,6 +54,7 @@ static void codel_params_init(struct codel_params *params)
params->interval = MS2TIME(100); params->interval = MS2TIME(100);
params->target = MS2TIME(5); params->target = MS2TIME(5);
params->ce_threshold = CODEL_DISABLED_THRESHOLD; params->ce_threshold = CODEL_DISABLED_THRESHOLD;
params->ce_threshold_ect1 = false;
params->ecn = false; params->ecn = false;
} }
...@@ -246,9 +247,20 @@ static struct sk_buff *codel_dequeue(void *ctx, ...@@ -246,9 +247,20 @@ static struct sk_buff *codel_dequeue(void *ctx,
vars->rec_inv_sqrt); vars->rec_inv_sqrt);
} }
end: end:
if (skb && codel_time_after(vars->ldelay, params->ce_threshold) && if (skb && codel_time_after(vars->ldelay, params->ce_threshold)) {
INET_ECN_set_ce(skb)) bool set_ce = true;
stats->ce_mark++;
if (params->ce_threshold_ect1) {
/* Note: if skb_get_dsfield() returns -1, following
* gives INET_ECN_MASK, which is != INET_ECN_ECT_1.
*/
u8 ecn = skb_get_dsfield(skb) & INET_ECN_MASK;
set_ce = (ecn == INET_ECN_ECT_1);
}
if (set_ce && INET_ECN_set_ce(skb))
stats->ce_mark++;
}
return skb; return skb;
} }
......
...@@ -188,6 +188,23 @@ static inline int INET_ECN_set_ce(struct sk_buff *skb) ...@@ -188,6 +188,23 @@ static inline int INET_ECN_set_ce(struct sk_buff *skb)
return 0; return 0;
} }
/*
 * skb_get_dsfield - read the DS field from an skb's IPv4 or IPv6 header.
 * @skb: packet to inspect
 *
 * Dispatches on skb_protocol(skb, true). For ETH_P_IP / ETH_P_IPV6 the
 * result of ipv4_get_dsfield() / ipv6_get_dsfield() is returned, provided
 * pskb_network_may_pull() succeeds for the corresponding header size.
 *
 * Returns -1 for any other protocol, or when pskb_network_may_pull()
 * fails.
 */
static inline int skb_get_dsfield(struct sk_buff *skb)
{
	int dsfield = -1;

	switch (skb_protocol(skb, true)) {
	case cpu_to_be16(ETH_P_IP):
		if (pskb_network_may_pull(skb, sizeof(struct iphdr)))
			dsfield = ipv4_get_dsfield(ip_hdr(skb));
		break;
	case cpu_to_be16(ETH_P_IPV6):
		if (pskb_network_may_pull(skb, sizeof(struct ipv6hdr)))
			dsfield = ipv6_get_dsfield(ipv6_hdr(skb));
		break;
	default:
		/* Neither IPv4 nor IPv6: keep the -1 sentinel. */
		break;
	}

	return dsfield;
}
static inline int INET_ECN_set_ect1(struct sk_buff *skb) static inline int INET_ECN_set_ect1(struct sk_buff *skb)
{ {
switch (skb_protocol(skb, true)) { switch (skb_protocol(skb, true)) {
......
...@@ -840,6 +840,7 @@ enum { ...@@ -840,6 +840,7 @@ enum {
TCA_FQ_CODEL_CE_THRESHOLD, TCA_FQ_CODEL_CE_THRESHOLD,
TCA_FQ_CODEL_DROP_BATCH_SIZE, TCA_FQ_CODEL_DROP_BATCH_SIZE,
TCA_FQ_CODEL_MEMORY_LIMIT, TCA_FQ_CODEL_MEMORY_LIMIT,
TCA_FQ_CODEL_CE_THRESHOLD_ECT1,
__TCA_FQ_CODEL_MAX __TCA_FQ_CODEL_MAX
}; };
......
...@@ -513,6 +513,7 @@ struct sta_info *sta_info_alloc(struct ieee80211_sub_if_data *sdata, ...@@ -513,6 +513,7 @@ struct sta_info *sta_info_alloc(struct ieee80211_sub_if_data *sdata,
sta->cparams.target = MS2TIME(20); sta->cparams.target = MS2TIME(20);
sta->cparams.interval = MS2TIME(100); sta->cparams.interval = MS2TIME(100);
sta->cparams.ecn = true; sta->cparams.ecn = true;
sta->cparams.ce_threshold_ect1 = false;
sta_dbg(sdata, "Allocated STA %pM\n", sta->sta.addr); sta_dbg(sdata, "Allocated STA %pM\n", sta->sta.addr);
......
...@@ -362,6 +362,7 @@ static const struct nla_policy fq_codel_policy[TCA_FQ_CODEL_MAX + 1] = { ...@@ -362,6 +362,7 @@ static const struct nla_policy fq_codel_policy[TCA_FQ_CODEL_MAX + 1] = {
[TCA_FQ_CODEL_CE_THRESHOLD] = { .type = NLA_U32 }, [TCA_FQ_CODEL_CE_THRESHOLD] = { .type = NLA_U32 },
[TCA_FQ_CODEL_DROP_BATCH_SIZE] = { .type = NLA_U32 }, [TCA_FQ_CODEL_DROP_BATCH_SIZE] = { .type = NLA_U32 },
[TCA_FQ_CODEL_MEMORY_LIMIT] = { .type = NLA_U32 }, [TCA_FQ_CODEL_MEMORY_LIMIT] = { .type = NLA_U32 },
[TCA_FQ_CODEL_CE_THRESHOLD_ECT1] = { .type = NLA_U8 },
}; };
static int fq_codel_change(struct Qdisc *sch, struct nlattr *opt, static int fq_codel_change(struct Qdisc *sch, struct nlattr *opt,
...@@ -408,6 +409,9 @@ static int fq_codel_change(struct Qdisc *sch, struct nlattr *opt, ...@@ -408,6 +409,9 @@ static int fq_codel_change(struct Qdisc *sch, struct nlattr *opt,
q->cparams.ce_threshold = (val * NSEC_PER_USEC) >> CODEL_SHIFT; q->cparams.ce_threshold = (val * NSEC_PER_USEC) >> CODEL_SHIFT;
} }
if (tb[TCA_FQ_CODEL_CE_THRESHOLD_ECT1])
q->cparams.ce_threshold_ect1 = !!nla_get_u8(tb[TCA_FQ_CODEL_CE_THRESHOLD_ECT1]);
if (tb[TCA_FQ_CODEL_INTERVAL]) { if (tb[TCA_FQ_CODEL_INTERVAL]) {
u64 interval = nla_get_u32(tb[TCA_FQ_CODEL_INTERVAL]); u64 interval = nla_get_u32(tb[TCA_FQ_CODEL_INTERVAL]);
...@@ -544,10 +548,13 @@ static int fq_codel_dump(struct Qdisc *sch, struct sk_buff *skb) ...@@ -544,10 +548,13 @@ static int fq_codel_dump(struct Qdisc *sch, struct sk_buff *skb)
q->flows_cnt)) q->flows_cnt))
goto nla_put_failure; goto nla_put_failure;
if (q->cparams.ce_threshold != CODEL_DISABLED_THRESHOLD && if (q->cparams.ce_threshold != CODEL_DISABLED_THRESHOLD) {
nla_put_u32(skb, TCA_FQ_CODEL_CE_THRESHOLD, if (nla_put_u32(skb, TCA_FQ_CODEL_CE_THRESHOLD,
codel_time_to_us(q->cparams.ce_threshold))) codel_time_to_us(q->cparams.ce_threshold)))
goto nla_put_failure; goto nla_put_failure;
if (nla_put_u8(skb, TCA_FQ_CODEL_CE_THRESHOLD_ECT1, q->cparams.ce_threshold_ect1))
goto nla_put_failure;
}
return nla_nest_end(skb, opts); return nla_nest_end(skb, opts);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment