bpf: fix cb access in socket filter programs

author Alexei Starovoitov <ast@plumgrid.com>

Wed, 7 Oct 2015 17:55:41 +0000 (10:55 -0700)

committer David S. Miller <davem@davemloft.net>

Sun, 11 Oct 2015 11:40:05 +0000 (04:40 -0700)
author Alexei Starovoitov <ast@plumgrid.com>
Wed, 7 Oct 2015 17:55:41 +0000 (10:55 -0700)
committer David S. Miller <davem@davemloft.net>
Sun, 11 Oct 2015 11:40:05 +0000 (04:40 -0700)
diff --git a/include/linux/bpf.h b/include/linux/bpf.h

index 3697ad5638996e086e79e4560f6042ca3d35b4de..b4fdee6cb68612a4eb7039b9f815f219b8ee5eca 100644 (file)
--- a/include/linux/bpf.h
+++ b/include/linux/bpf.h
@@ -100,6 +100,8 @@ enum bpf_access_type {
         BPF_WRITE = 2
  };
  
+struct bpf_prog;
+
  struct bpf_verifier_ops {
         /* return eBPF function prototype for verification */
         const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id);
@@ -111,7 +113,7 @@ struct bpf_verifier_ops {
  
         u32 (*convert_ctx_access)(enum bpf_access_type type, int dst_reg,
                                   int src_reg, int ctx_off,
-                                 struct bpf_insn *insn);
+                                 struct bpf_insn *insn, struct bpf_prog *prog);
  };
  
  struct bpf_prog_type_list {
@@ -120,8 +122,6 @@ struct bpf_prog_type_list {
         enum bpf_prog_type type;
  };
  
-struct bpf_prog;
-
  struct bpf_prog_aux {
         atomic_t refcnt;
         u32 used_map_cnt;
diff --git a/include/linux/filter.h b/include/linux/filter.h

index 1bbce14bcf17975b3b4089f0a0e87ef99047f7b7..4165e9ac9e36aa82735f40a790e25e0b7218c95b 100644 (file)
--- a/include/linux/filter.h
+++ b/include/linux/filter.h
@@ -13,6 +13,7 @@
  #include <linux/printk.h>
  #include <linux/workqueue.h>
  #include <linux/sched.h>
+#include <net/sch_generic.h>
  
  #include <asm/cacheflush.h>
  
@@ -302,10 +303,6 @@ struct bpf_prog_aux;
         bpf_size;                                               \
  })
  
-/* Macro to invoke filter function. */
-#define SK_RUN_FILTER(filter, ctx) \
-       (*filter->prog->bpf_func)(ctx, filter->prog->insnsi)
-
  #ifdef CONFIG_COMPAT
  /* A struct sock_filter is architecture independent. */
  struct compat_sock_fprog {
@@ -329,6 +326,7 @@ struct bpf_prog {
         kmemcheck_bitfield_begin(meta);
         u16                     jited:1,        /* Is our filter JIT'ed? */
                                 gpl_compatible:1, /* Is filter GPL compatible? */
+                               cb_access:1,    /* Is control block accessed? */
                                 dst_needed:1;   /* Do we need dst entry? */
         kmemcheck_bitfield_end(meta);
         u32                     len;            /* Number of filter blocks */
@@ -352,6 +350,39 @@ struct sk_filter {
  
  #define BPF_PROG_RUN(filter, ctx)  (*filter->bpf_func)(ctx, filter->insnsi)
  
+static inline u32 bpf_prog_run_save_cb(const struct bpf_prog *prog,
+                                      struct sk_buff *skb)
+{
+       u8 *cb_data = qdisc_skb_cb(skb)->data;
+       u8 saved_cb[QDISC_CB_PRIV_LEN];
+       u32 res;
+
+       BUILD_BUG_ON(FIELD_SIZEOF(struct __sk_buff, cb) !=
+                    QDISC_CB_PRIV_LEN);
+
+       if (unlikely(prog->cb_access)) {
+               memcpy(saved_cb, cb_data, sizeof(saved_cb));
+               memset(cb_data, 0, sizeof(saved_cb));
+       }
+
+       res = BPF_PROG_RUN(prog, skb);
+
+       if (unlikely(prog->cb_access))
+               memcpy(cb_data, saved_cb, sizeof(saved_cb));
+
+       return res;
+}
+
+static inline u32 bpf_prog_run_clear_cb(const struct bpf_prog *prog,
+                                       struct sk_buff *skb)
+{
+       u8 *cb_data = qdisc_skb_cb(skb)->data;
+
+       if (unlikely(prog->cb_access))
+               memset(cb_data, 0, QDISC_CB_PRIV_LEN);
+       return BPF_PROG_RUN(prog, skb);
+}
+
  static inline unsigned int bpf_prog_size(unsigned int proglen)
  {
         return max(sizeof(struct bpf_prog),
diff --git a/kernel/bpf/verifier.c b/kernel/bpf/verifier.c

index b074b23000d6e95792e7fcefe0cd29e5a649a6ea..f8da034c225822a59db5529c4675dacba26146c5 100644 (file)
--- a/kernel/bpf/verifier.c
+++ b/kernel/bpf/verifier.c
@@ -2024,7 +2024,7 @@ static int convert_ctx_accesses(struct verifier_env *env)
  
                 cnt = env->prog->aux->ops->
                         convert_ctx_access(type, insn->dst_reg, insn->src_reg,
-                                          insn->off, insn_buf);
+                                          insn->off, insn_buf, env->prog);
                 if (cnt == 0 || cnt >= ARRAY_SIZE(insn_buf)) {
                         verbose("bpf verifier is misconfigured\n");
                         return -EINVAL;
diff --git a/net/core/filter.c b/net/core/filter.c

index 342e6c8fc415bb6a565b62d22363161208aae8e0..5f4cf1cffed366c400104e61b032d95de1591edf 100644 (file)
--- a/net/core/filter.c
+++ b/net/core/filter.c
@@ -56,10 +56,10 @@
   *     @sk: sock associated with &sk_buff
   *     @skb: buffer to filter
   *
- * Run the filter code and then cut skb->data to correct size returned by
- * SK_RUN_FILTER. If pkt_len is 0 we toss packet. If skb->len is smaller
+ * Run the eBPF program and then cut skb->data to correct size returned by
+ * the program. If pkt_len is 0 we toss packet. If skb->len is smaller
   * than pkt_len we keep whole skb->data. This is the socket level
- * wrapper to SK_RUN_FILTER. It returns 0 if the packet should
+ * wrapper to BPF_PROG_RUN. It returns 0 if the packet should
   * be accepted or -EPERM if the packet should be tossed.
   *
   */
@@ -83,7 +83,7 @@ int sk_filter(struct sock *sk, struct sk_buff *skb)
         rcu_read_lock();
         filter = rcu_dereference(sk->sk_filter);
         if (filter) {
-               unsigned int pkt_len = SK_RUN_FILTER(filter, skb);
+               unsigned int pkt_len = bpf_prog_run_save_cb(filter->prog, skb);
  
                 err = pkt_len ? pskb_trim(skb, pkt_len) : -EPERM;
         }
@@ -1736,7 +1736,8 @@ static bool tc_cls_act_is_valid_access(int off, int size,
  
  static u32 bpf_net_convert_ctx_access(enum bpf_access_type type, int dst_reg,
                                       int src_reg, int ctx_off,
-                                     struct bpf_insn *insn_buf)
+                                     struct bpf_insn *insn_buf,
+                                     struct bpf_prog *prog)
  {
         struct bpf_insn *insn = insn_buf;
  
@@ -1827,6 +1828,7 @@ static u32 bpf_net_convert_ctx_access(enum bpf_access_type type, int dst_reg,
                 offsetof(struct __sk_buff, cb[4]):
                 BUILD_BUG_ON(FIELD_SIZEOF(struct qdisc_skb_cb, data) < 20);
  
+               prog->cb_access = 1;
                 ctx_off -= offsetof(struct __sk_buff, cb[0]);
                 ctx_off += offsetof(struct sk_buff, cb);
                 ctx_off += offsetof(struct qdisc_skb_cb, data);
diff --git a/net/packet/af_packet.c b/net/packet/af_packet.c

index 81c900fbc4a409e4f75a349b4f29d195845a165a..104910f7d1fb644117575d0163b80b659923c99d 100644 (file)
--- a/net/packet/af_packet.c
+++ b/net/packet/af_packet.c
@@ -1423,7 +1423,7 @@ static unsigned int fanout_demux_bpf(struct packet_fanout *f,
         rcu_read_lock();
         prog = rcu_dereference(f->bpf_prog);
         if (prog)
-               ret = BPF_PROG_RUN(prog, skb) % num;
+               ret = bpf_prog_run_clear_cb(prog, skb) % num;
         rcu_read_unlock();
  
         return ret;
@@ -1939,16 +1939,16 @@ out_free:
         return err;
  }
  
-static unsigned int run_filter(const struct sk_buff *skb,
-                                     const struct sock *sk,
-                                     unsigned int res)
+static unsigned int run_filter(struct sk_buff *skb,
+                              const struct sock *sk,
+                              unsigned int res)
  {
         struct sk_filter *filter;
  
         rcu_read_lock();
         filter = rcu_dereference(sk->sk_filter);
         if (filter != NULL)
-               res = SK_RUN_FILTER(filter, skb);
+               res = bpf_prog_run_clear_cb(filter->prog, skb);
         rcu_read_unlock();
  
         return res;
author	Alexei Starovoitov <ast@plumgrid.com>
	Wed, 7 Oct 2015 17:55:41 +0000 (10:55 -0700)
committer	David S. Miller <davem@davemloft.net>
	Sun, 11 Oct 2015 11:40:05 +0000 (04:40 -0700)
include/linux/bpf.h		patch \| blob \| history
include/linux/filter.h		patch \| blob \| history
kernel/bpf/verifier.c		patch \| blob \| history
net/core/filter.c		patch \| blob \| history
net/packet/af_packet.c		patch \| blob \| history