/*
 * Seccomp filter example for x86 (32-bit and 64-bit) with BPF macros
 *
 * Copyright (c) 2012 The Chromium OS Authors <chromium-os-dev@chromium.org>
 * Author: Will Drewry <wad@chromium.org>
 *
 * The code may be used by anyone for any purpose,
 * and can serve as a starting point for developing
 * applications using prctl(PR_SET_SECCOMP, 2, ...).
 */
11 #if defined(__i386__) || defined(__x86_64__)
12 #define SUPPORTED_ARCH 1
15 #if defined(SUPPORTED_ARCH)
#include <linux/types.h>
#include <linux/audit.h>
#include <linux/filter.h>
#include <linux/seccomp.h>
#include <linux/unistd.h>
#include <signal.h>
#include <stddef.h>
#include <stdio.h>
#include <string.h>
#include <sys/prctl.h>
#include <unistd.h>
/*
 * Byte offsets into struct seccomp_data, used as the absolute load
 * address of BPF_LD+BPF_W+BPF_ABS instructions.
 */
#define syscall_arg(_n) (offsetof(struct seccomp_data, args[_n]))
#define syscall_nr (offsetof(struct seccomp_data, nr))

/*
 * Indices into ucontext_t's uc_mcontext.gregs[] for the syscall number,
 * the return value and the six syscall arguments.  The number and the
 * result share one register on both ABIs.  No #else branch is needed:
 * this code is only compiled when SUPPORTED_ARCH is defined, which
 * already implies one of the two architectures below.
 */
#if defined(__i386__)
#define REG_RESULT	REG_EAX
#define REG_SYSCALL	REG_EAX
#define REG_ARG0	REG_EBX
#define REG_ARG1	REG_ECX
#define REG_ARG2	REG_EDX
#define REG_ARG3	REG_ESI
#define REG_ARG4	REG_EDI
#define REG_ARG5	REG_EBP
#elif defined(__x86_64__)
#define REG_RESULT	REG_RAX
#define REG_SYSCALL	REG_RAX
#define REG_ARG0	REG_RDI
#define REG_ARG1	REG_RSI
#define REG_ARG2	REG_RDX
#define REG_ARG3	REG_R10
#define REG_ARG4	REG_R8
#define REG_ARG5	REG_R9
#endif
/* Fallbacks for toolchain headers that predate seccomp filter support. */
#ifndef PR_SET_NO_NEW_PRIVS
#define PR_SET_NO_NEW_PRIVS 38
#endif

/* si_code value delivered with SIGSYS when a filter returns SECCOMP_RET_TRAP. */
#ifndef SYS_SECCOMP
#define SYS_SECCOMP 1
#endif
61 static void emulator(int nr, siginfo_t *info, void *void_context)
63 ucontext_t *ctx = (ucontext_t *)(void_context);
68 if (info->si_code != SYS_SECCOMP)
72 syscall = ctx->uc_mcontext.gregs[REG_SYSCALL];
73 buf = (char *) ctx->uc_mcontext.gregs[REG_ARG1];
74 len = (size_t) ctx->uc_mcontext.gregs[REG_ARG2];
76 if (syscall != __NR_write)
78 if (ctx->uc_mcontext.gregs[REG_ARG0] != STDERR_FILENO)
80 /* Redirect stderr messages to stdout. Doesn't handle EINTR, etc */
81 ctx->uc_mcontext.gregs[REG_RESULT] = -1;
82 if (write(STDOUT_FILENO, "[ERR] ", 6) > 0) {
83 bytes = write(STDOUT_FILENO, buf, len);
84 ctx->uc_mcontext.gregs[REG_RESULT] = bytes;
89 static int install_emulator(void)
93 memset(&act, 0, sizeof(act));
95 sigaddset(&mask, SIGSYS);
97 act.sa_sigaction = &emulator;
98 act.sa_flags = SA_SIGINFO;
99 if (sigaction(SIGSYS, &act, NULL) < 0) {
103 if (sigprocmask(SIG_UNBLOCK, &mask, NULL)) {
104 perror("sigprocmask");
110 static int install_filter(void)
112 struct sock_filter filter[] = {
113 /* Grab the system call number */
114 BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_nr),
115 /* Jump table for the allowed syscalls */
116 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_rt_sigreturn, 0, 1),
117 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
118 #ifdef __NR_sigreturn
119 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_sigreturn, 0, 1),
120 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
122 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_exit_group, 0, 1),
123 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
124 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_exit, 0, 1),
125 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
126 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_read, 1, 0),
127 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_write, 3, 2),
129 /* Check that read is only using stdin. */
130 BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_arg(0)),
131 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDIN_FILENO, 4, 0),
132 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_KILL),
134 /* Check that write is only using stdout */
135 BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_arg(0)),
136 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDOUT_FILENO, 1, 0),
137 /* Trap attempts to write to stderr */
138 BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDERR_FILENO, 1, 2),
140 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
141 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_TRAP),
142 BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_KILL),
144 struct sock_fprog prog = {
145 .len = (unsigned short)(sizeof(filter)/sizeof(filter[0])),
149 if (prctl(PR_SET_NO_NEW_PRIVS, 1, 0, 0, 0)) {
150 perror("prctl(NO_NEW_PRIVS)");
155 if (prctl(PR_SET_SECCOMP, SECCOMP_MODE_FILTER, &prog)) {
/*
 * Expand a string literal into "pointer, length" arguments.  The length
 * excludes the terminating NUL so it is not written to the descriptor.
 */
#define payload(_c) (_c), (sizeof((_c)) - 1)

/*
 * Demo driver: installs the SIGSYS emulator and the seccomp filter,
 * then prompts on stdout, reads a name from stdin, greets it on stdout
 * and finally writes to stderr to exercise the trap path.
 *
 * Returns 0 on success, 1 if either installation step fails.
 */
int main(int argc, char **argv)
{
	char buf[4096];
	ssize_t bytes;

	(void)argc;
	(void)argv;

	if (install_emulator())
		return 1;
	if (install_filter())
		return 1;

	syscall(__NR_write, STDOUT_FILENO,
		payload("OHAI! WHAT IS YOUR NAME? "));
	bytes = syscall(__NR_read, STDIN_FILENO, buf, sizeof(buf));
	syscall(__NR_write, STDOUT_FILENO, payload("HELLO, "));
	/* A failed read returns -1, which must not be used as a length. */
	if (bytes > 0)
		syscall(__NR_write, STDOUT_FILENO, buf, bytes);
	syscall(__NR_write, STDERR_FILENO,
		payload("Error message going to STDERR\n"));
	return 0;
}
180 #else /* SUPPORTED_ARCH */
182 * This sample is x86-only. Since kernel samples are compiled with the
183 * host toolchain, a non-x86 host will result in using only the main()
190 #endif /* SUPPORTED_ARCH */