]> www.infradead.org Git - users/hch/misc.git/commitdiff
tcp: accecn: AccECN option ceb/cep and ACE field multi-wrap heuristics
authorIlpo Järvinen <ij@kernel.org>
Tue, 16 Sep 2025 08:24:33 +0000 (10:24 +0200)
committerPaolo Abeni <pabeni@redhat.com>
Thu, 18 Sep 2025 06:47:52 +0000 (08:47 +0200)
The AccECN option ceb/cep heuristic algorithm is from AccECN spec
Appendix A.2.2 to mitigate against false ACE field overflows. Armed
with ceb delta from option, delivered bytes, and delivered packets it
is possible to estimate how many times ACE field wrapped.

This calculation is necessary only if more than one wrap is possible.
Without SACK, delivered bytes and packets are not always trustworthy in
which case TCP falls back to the simpler no-or-all wraps ceb algorithm.

Signed-off-by: Ilpo Järvinen <ij@kernel.org>
Signed-off-by: Chia-Yu Chang <chia-yu.chang@nokia-bell-labs.com>
Acked-by: Paolo Abeni <pabeni@redhat.com>
Reviewed-by: Eric Dumazet <edumazet@google.com>
Link: https://patch.msgid.link/20250916082434.100722-10-chia-yu.chang@nokia-bell-labs.com
Signed-off-by: Paolo Abeni <pabeni@redhat.com>
include/net/tcp.h
net/ipv4/tcp_input.c

index 78dd7b8a414520354e303de3ce059c6faa27f01c..7c51a0a5ace820bd45d4cc551a15154f8488a880 100644 (file)
@@ -256,6 +256,7 @@ static_assert((1 << ATO_BITS) > TCP_DELACK_MAX);
 #define TCP_ACCECN_MAXSIZE             (TCPOLEN_ACCECN_BASE + \
                                         TCPOLEN_ACCECN_PERFIELD * \
                                         TCP_ACCECN_NUMFIELDS)
+#define TCP_ACCECN_SAFETY_SHIFT                1 /* SAFETY_FACTOR in accecn draft */
 
 /* Flags in tp->nonagle */
 #define TCP_NAGLE_OFF          1       /* Nagle's algo is disabled */
index 5732f2d4329c40f361df2e5636f57a61cbb82e9c..9fdc6ce25eb1035a88ff2640601cc665187a78b2 100644 (file)
@@ -493,16 +493,19 @@ static u32 __tcp_accecn_process(struct sock *sk, const struct sk_buff *skb,
                                u32 delivered_pkts, u32 delivered_bytes,
                                int flag)
 {
+       u32 old_ceb = tcp_sk(sk)->delivered_ecn_bytes[INET_ECN_CE - 1];
        const struct tcphdr *th = tcp_hdr(skb);
        struct tcp_sock *tp = tcp_sk(sk);
-       u32 delta, safe_delta;
+       u32 delta, safe_delta, d_ceb;
+       bool opt_deltas_valid;
        u32 corrected_ace;
 
        /* Reordered ACK or uncertain due to lack of data to send and ts */
        if (!(flag & (FLAG_FORWARD_PROGRESS | FLAG_TS_PROGRESS)))
                return 0;
 
-       tcp_accecn_process_option(tp, skb, delivered_bytes, flag);
+       opt_deltas_valid = tcp_accecn_process_option(tp, skb,
+                                                    delivered_bytes, flag);
 
        if (!(flag & FLAG_SLOWPATH)) {
                /* AccECN counter might overflow on large ACKs */
@@ -525,6 +528,35 @@ static u32 __tcp_accecn_process(struct sock *sk, const struct sk_buff *skb,
        safe_delta = delivered_pkts -
                     ((delivered_pkts - delta) & TCP_ACCECN_CEP_ACE_MASK);
 
+       if (opt_deltas_valid) {
+               d_ceb = tp->delivered_ecn_bytes[INET_ECN_CE - 1] - old_ceb;
+               if (!d_ceb)
+                       return delta;
+
+               if ((delivered_pkts >= (TCP_ACCECN_CEP_ACE_MASK + 1) * 2) &&
+                   (tcp_is_sack(tp) ||
+                    ((1 << inet_csk(sk)->icsk_ca_state) &
+                     (TCPF_CA_Open | TCPF_CA_CWR)))) {
+                       u32 est_d_cep;
+
+                       if (delivered_bytes <= d_ceb)
+                               return safe_delta;
+
+                       est_d_cep = DIV_ROUND_UP_ULL((u64)d_ceb *
+                                                    delivered_pkts,
+                                                    delivered_bytes);
+                       return min(safe_delta,
+                                  delta +
+                                  (est_d_cep & ~TCP_ACCECN_CEP_ACE_MASK));
+               }
+
+               if (d_ceb > delta * tp->mss_cache)
+                       return safe_delta;
+               if (d_ceb <
+                   safe_delta * tp->mss_cache >> TCP_ACCECN_SAFETY_SHIFT)
+                       return delta;
+       }
+
        return safe_delta;
 }