Thread (39 messages) 39 messages, 9 authors, 2012-03-05

Re: [PATCH v12 01/13] sk_run_filter: add support for custom load_pointer

From: Will Drewry <wad@chromium.org>
Date: 2012-03-02 18:47:58
Also in: lkml, netdev

On Fri, Mar 2, 2012 at 4:40 AM, Indan Zupancic [off-list ref] wrote:
quoted hunk ↗ jump to hunk
Hello,

On Thu, March 1, 2012 00:53, Will Drewry wrote:
quoted
 include/linux/filter.h |   46 +++++++++++++++++++
 net/core/filter.c      |  117 +++++++++++++++++++++++++++++++++++++++++++++---
 2 files changed, 157 insertions(+), 6 deletions(-)
I propose a slightly different approach:

Instead of more or less allowing generic load instructions, do the
same as the ancillary data functions and only allow BPF_S_LD_W_ABS.
In addition to that, rewrite and check the functions ourself after
sk_chk_filter() has done its checks.

Diff for filter.c:
diff --git a/include/linux/filter.h b/include/linux/filter.h
index 8eeb205..63b728c 100644
--- a/include/linux/filter.h
+++ b/include/linux/filter.h
@@ -228,6 +228,7 @@ enum {
       BPF_S_ANC_HATYPE,
       BPF_S_ANC_RXHASH,
       BPF_S_ANC_CPU,
+       BPF_S_LD_W_SECCOMP,
 };

 #endif /* __KERNEL__ */
diff --git a/net/core/filter.c b/net/core/filter.c
index 5dea452..7e338d6 100644
--- a/net/core/filter.c
+++ b/net/core/filter.c
@@ -350,6 +350,9 @@ load_b:
                               A = 0;
                       continue;
               }
+               case BPF_S_LD_W_SECCOMP:
+                       A = seccomp_load(fentry->k);
+                       continue;
This is plenty nice as far as I'm concerned.  I wonder what the
networking people think?

I proposed a generic bpf interface, but if simply scoping it down to a
single additional seccomp instruction is okay, then we can address
additional instruction support or other generalizations later when
there is a motivating case.

               default:
                       WARN_RATELIMIT(1, "Unknown code:%u jt:%u tf:%u k:%u\n",
                                      fentry->code, fentry->jt,
---

And in seccomp add something like:

/*
 * Does SECCOMP specific checks.
 * Should be called after sk_chk_filter(), as it assumes all instructions
 * are rewritten to the kernel enum format.
 * No SKB touching instructions are allowed. Only data LD instruction allowed
 * is BPF_S_LD_W_ABS, which will be handled by seccomp_load().
 */
int seccomp_check_filter(const struct sock_filter *filter, unsigned int flen)
{
       int pc;

       /* Make sure there are no SKB using instructions */
       for (pc = 0; pc < flen; pc++) {
               u16 code = filter->code;
               unsigned int k = filter->k;

               if (code <= BPF_S_ALU_NEG)
                       continue;
               if (code >= BPF_S_LDX_IMM && code < BPF_S_ANC_PROTOCOL)
                       continue;
               switch (code) {
               case BPF_S_LD_W_ABS:
                       filter->code = BPF_S_LD_W_SECCOMP;
                       if (k >= sizeof(struct seccomp_data) || k & 3)
                               return -EINVAL;
                       continue;
               case BPF_S_LD_W_LEN:
                       filter->code = BPF_S_LD_IMM;
                       filter->k = sizeof(struct seccomp_data);
                       continue;
               case BPF_S_LD_IMM:
                       continue;
               case BPF_S_LDX_W_LEN:
                       filter->code = BPF_S_LDX_IMM;
                       filter->k = sizeof(struct seccomp_data);
Mapping to LD[X]_IMM is really nice.
                       continue;
               default:
                       return -EINVAL;
               }
       }
       return 0;
}

u32 seccomp_load(int off)
{
       u32 A;
       struct pt_regs *regs = task_pt_regs(current);

       if (off >= BPF_DATA(args[0]) && off < BPF_DATA(args[6])) {
               int arg = (off - BPF_DATA(args[0])) / sizeof(u64);
               int index = (off % sizeof(u64)) ? 1 : 0;
               syscall_get_arguments(current, regs, arg, 1, &value);
               A = get_u32(value, index);
       } else if (off == BPF_DATA(nr)) {
               A = syscall_get_nr(current, regs);
       } else if (off == BPF_DATA(arch)) {
               A = syscall_get_arch(current, regs);
       } else if (off == BPF_DATA(instruction_pointer)) {
               A = get_u32(KSTK_EIP(current), 0);
       } else if (off == BPF_DATA(instruction_pointer) + sizeof(u32)) {
               A = get_u32(KSTK_EIP(current), 1);
       }
       return A;
}

This way you can even add SECCOMP specific functions in the future by using
special offsets. (E.g. 64-bit compare between an arg and scratch memory.)
Yeah this would be a nice option if a more specialized (yet less
invasive) approach is appealing to the networking people.  Eric, Joe,
netdev, ... any opinions?  Would a standalone version be more useful?

Thanks!
will
Keyboard shortcuts
hback out one level
jnext message in thread
kprevious message in thread
ldrill in
Escclose help / fold thread tree
?toggle this help