bpf: Improve the general precision of tnum_mul

author Nandakumar Edamana <nandakumar@nandakumar.co.in>

Tue, 26 Aug 2025 03:45:23 +0000 (09:15 +0530)

committer Andrii Nakryiko <andrii@kernel.org>

Wed, 27 Aug 2025 22:00:26 +0000 (15:00 -0700)
author Nandakumar Edamana <nandakumar@nandakumar.co.in>
Tue, 26 Aug 2025 03:45:23 +0000 (09:15 +0530)
committer Andrii Nakryiko <andrii@kernel.org>
Wed, 27 Aug 2025 22:00:26 +0000 (15:00 -0700)
diff --git a/include/linux/tnum.h b/include/linux/tnum.h

index 0ffb77ffe0e873783efc5a7fe9dc4c65167df499..c52b862dad45be949c9a1a6be508072e1462536c 100644 (file)
--- a/include/linux/tnum.h
+++ b/include/linux/tnum.h
@@ -57,6 +57,9 @@ bool tnum_overlap(struct tnum a, struct tnum b);
  /* Return a tnum representing numbers satisfying both @a and @b */
  struct tnum tnum_intersect(struct tnum a, struct tnum b);
  
+/* Return a tnum representing numbers satisfying either @t1 or @t2 */
+struct tnum tnum_union(struct tnum t1, struct tnum t2);
+
  /* Return @a with all but the lowest @size bytes cleared */
  struct tnum tnum_cast(struct tnum a, u8 size);
  
diff --git a/kernel/bpf/tnum.c b/kernel/bpf/tnum.c

index d9328bbb3680b51bc398bb869e5d81d22895a6b2..f8e70e9c3998d475509aaf1257e2f4939e8a6995 100644 (file)
--- a/kernel/bpf/tnum.c
+++ b/kernel/bpf/tnum.c
@@ -116,31 +116,47 @@ struct tnum tnum_xor(struct tnum a, struct tnum b)
         return TNUM(v & ~mu, mu);
  }
  
-/* Generate partial products by multiplying each bit in the multiplier (tnum a)
- * with the multiplicand (tnum b), and add the partial products after
- * appropriately bit-shifting them. Instead of directly performing tnum addition
- * on the generated partial products, equivalenty, decompose each partial
- * product into two tnums, consisting of the value-sum (acc_v) and the
- * mask-sum (acc_m) and then perform tnum addition on them. The following paper
- * explains the algorithm in more detail: https://arxiv.org/abs/2105.05398.
+/* Perform long multiplication, iterating through the bits in a using rshift:
+ * - if LSB(a) is a known 0, keep current accumulator
+ * - if LSB(a) is a known 1, add b to current accumulator
+ * - if LSB(a) is unknown, take a union of the above cases.
+ *
+ * For example:
+ *
+ *               acc_0:        acc_1:
+ *
+ *     11 *  ->      11 *  ->      11 *  -> union(0011, 1001) == x0x1
+ *     x1            01            11
+ * ------        ------        ------
+ *     11            11            11
+ *    xx            00            11
+ * ------        ------        ------
+ *   ????          0011          1001
   */
  struct tnum tnum_mul(struct tnum a, struct tnum b)
  {
-       u64 acc_v = a.value * b.value;
-       struct tnum acc_m = TNUM(0, 0);
+       struct tnum acc = TNUM(0, 0);
  
         while (a.value || a.mask) {
                 /* LSB of tnum a is a certain 1 */
                 if (a.value & 1)
-                       acc_m = tnum_add(acc_m, TNUM(0, b.mask));
+                       acc = tnum_add(acc, b);
                 /* LSB of tnum a is uncertain */
-               else if (a.mask & 1)
-                       acc_m = tnum_add(acc_m, TNUM(0, b.value | b.mask));
+               else if (a.mask & 1) {
+                       /* acc = tnum_union(acc_0, acc_1), where acc_0 and
+                        * acc_1 are partial accumulators for cases
+                        * LSB(a) = certain 0 and LSB(a) = certain 1.
+                        * acc_0 = acc + 0 * b = acc.
+                        * acc_1 = acc + 1 * b = tnum_add(acc, b).
+                        */
+
+                       acc = tnum_union(acc, tnum_add(acc, b));
+               }
                 /* Note: no case for LSB is certain 0 */
                 a = tnum_rshift(a, 1);
                 b = tnum_lshift(b, 1);
         }
-       return tnum_add(TNUM(acc_v, 0), acc_m);
+       return acc;
  }
  
  bool tnum_overlap(struct tnum a, struct tnum b)
@@ -163,6 +179,19 @@ struct tnum tnum_intersect(struct tnum a, struct tnum b)
         return TNUM(v & ~mu, mu);
  }
  
+/* Returns a tnum with the uncertainty from both a and b, plus new uncertainty
+ * at any bit position where a and b disagree. The result represents a
+ * superset of the union of the concrete sets of a and b. Despite the
+ * overapproximation, it is optimal: no more precise tnum contains both sets.
+ */
+struct tnum tnum_union(struct tnum a, struct tnum b)
+{
+       u64 v = a.value & b.value;
+       u64 mu = (a.value ^ b.value) | a.mask | b.mask;
+
+       return TNUM(v & ~mu, mu);
+}
+
  struct tnum tnum_cast(struct tnum a, u8 size)
  {
         a.value &= (1ULL << (size * 8)) - 1;
author	Nandakumar Edamana <nandakumar@nandakumar.co.in>
	Tue, 26 Aug 2025 03:45:23 +0000 (09:15 +0530)
committer	Andrii Nakryiko <andrii@kernel.org>
	Wed, 27 Aug 2025 22:00:26 +0000 (15:00 -0700)
include/linux/tnum.h		patch | blob | history
kernel/bpf/tnum.c		patch | blob | history