| 
									
										
										
										
											2012-04-12 16:48:04 -05:00
										 |  |  | /*
 | 
					
						
							|  |  |  |  * Seccomp filter example for x86 (32-bit and 64-bit) with BPF macros | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Copyright (c) 2012 The Chromium OS Authors <chromium-os-dev@chromium.org> | 
					
						
							|  |  |  |  * Author: Will Drewry <wad@chromium.org> | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * The code may be used by anyone for any purpose, | 
					
						
							|  |  |  |  * and can serve as a starting point for developing | 
					
						
							|  |  |  |  * applications using prctl(PR_SET_SECCOMP, 2, ...). | 
					
						
							|  |  |  |  */ | 
					
						
							| 
									
										
										
										
											2012-04-18 19:50:25 -05:00
										 |  |  | #if defined(__i386__) || defined(__x86_64__)
 | 
					
						
							|  |  |  | #define SUPPORTED_ARCH 1
 | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #if defined(SUPPORTED_ARCH)
 | 
					
						
							| 
									
										
										
										
											2012-04-12 16:48:04 -05:00
										 |  |  | #define __USE_GNU 1
 | 
					
						
							|  |  |  | #define _GNU_SOURCE 1
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include <linux/types.h>
 | 
					
						
							|  |  |  | #include <linux/filter.h>
 | 
					
						
							|  |  |  | #include <linux/seccomp.h>
 | 
					
						
							|  |  |  | #include <linux/unistd.h>
 | 
					
						
							|  |  |  | #include <signal.h>
 | 
					
						
							|  |  |  | #include <stdio.h>
 | 
					
						
							|  |  |  | #include <stddef.h>
 | 
					
						
							|  |  |  | #include <string.h>
 | 
					
						
							|  |  |  | #include <sys/prctl.h>
 | 
					
						
							|  |  |  | #include <unistd.h>
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #define syscall_arg(_n) (offsetof(struct seccomp_data, args[_n]))
 | 
					
						
							|  |  |  | #define syscall_nr (offsetof(struct seccomp_data, nr))
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #if defined(__i386__)
 | 
					
						
							|  |  |  | #define REG_RESULT	REG_EAX
 | 
					
						
							|  |  |  | #define REG_SYSCALL	REG_EAX
 | 
					
						
							|  |  |  | #define REG_ARG0	REG_EBX
 | 
					
						
							|  |  |  | #define REG_ARG1	REG_ECX
 | 
					
						
							|  |  |  | #define REG_ARG2	REG_EDX
 | 
					
						
							|  |  |  | #define REG_ARG3	REG_ESI
 | 
					
						
							|  |  |  | #define REG_ARG4	REG_EDI
 | 
					
						
							|  |  |  | #define REG_ARG5	REG_EBP
 | 
					
						
							|  |  |  | #elif defined(__x86_64__)
 | 
					
						
							|  |  |  | #define REG_RESULT	REG_RAX
 | 
					
						
							|  |  |  | #define REG_SYSCALL	REG_RAX
 | 
					
						
							|  |  |  | #define REG_ARG0	REG_RDI
 | 
					
						
							|  |  |  | #define REG_ARG1	REG_RSI
 | 
					
						
							|  |  |  | #define REG_ARG2	REG_RDX
 | 
					
						
							|  |  |  | #define REG_ARG3	REG_R10
 | 
					
						
							|  |  |  | #define REG_ARG4	REG_R8
 | 
					
						
							|  |  |  | #define REG_ARG5	REG_R9
 | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifndef PR_SET_NO_NEW_PRIVS
 | 
					
						
							|  |  |  | #define PR_SET_NO_NEW_PRIVS 38
 | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifndef SYS_SECCOMP
 | 
					
						
							|  |  |  | #define SYS_SECCOMP 1
 | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static void emulator(int nr, siginfo_t *info, void *void_context) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	ucontext_t *ctx = (ucontext_t *)(void_context); | 
					
						
							|  |  |  | 	int syscall; | 
					
						
							|  |  |  | 	char *buf; | 
					
						
							|  |  |  | 	ssize_t bytes; | 
					
						
							|  |  |  | 	size_t len; | 
					
						
							|  |  |  | 	if (info->si_code != SYS_SECCOMP) | 
					
						
							|  |  |  | 		return; | 
					
						
							|  |  |  | 	if (!ctx) | 
					
						
							|  |  |  | 		return; | 
					
						
							|  |  |  | 	syscall = ctx->uc_mcontext.gregs[REG_SYSCALL]; | 
					
						
							|  |  |  | 	buf = (char *) ctx->uc_mcontext.gregs[REG_ARG1]; | 
					
						
							|  |  |  | 	len = (size_t) ctx->uc_mcontext.gregs[REG_ARG2]; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (syscall != __NR_write) | 
					
						
							|  |  |  | 		return; | 
					
						
							|  |  |  | 	if (ctx->uc_mcontext.gregs[REG_ARG0] != STDERR_FILENO) | 
					
						
							|  |  |  | 		return; | 
					
						
							|  |  |  | 	/* Redirect stderr messages to stdout. Doesn't handle EINTR, etc */ | 
					
						
							|  |  |  | 	ctx->uc_mcontext.gregs[REG_RESULT] = -1; | 
					
						
							|  |  |  | 	if (write(STDOUT_FILENO, "[ERR] ", 6) > 0) { | 
					
						
							|  |  |  | 		bytes = write(STDOUT_FILENO, buf, len); | 
					
						
							|  |  |  | 		ctx->uc_mcontext.gregs[REG_RESULT] = bytes; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 	return; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static int install_emulator(void) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	struct sigaction act; | 
					
						
							|  |  |  | 	sigset_t mask; | 
					
						
							|  |  |  | 	memset(&act, 0, sizeof(act)); | 
					
						
							|  |  |  | 	sigemptyset(&mask); | 
					
						
							|  |  |  | 	sigaddset(&mask, SIGSYS); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	act.sa_sigaction = &emulator; | 
					
						
							|  |  |  | 	act.sa_flags = SA_SIGINFO; | 
					
						
							|  |  |  | 	if (sigaction(SIGSYS, &act, NULL) < 0) { | 
					
						
							|  |  |  | 		perror("sigaction"); | 
					
						
							|  |  |  | 		return -1; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 	if (sigprocmask(SIG_UNBLOCK, &mask, NULL)) { | 
					
						
							|  |  |  | 		perror("sigprocmask"); | 
					
						
							|  |  |  | 		return -1; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 	return 0; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static int install_filter(void) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	struct sock_filter filter[] = { | 
					
						
							|  |  |  | 		/* Grab the system call number */ | 
					
						
							|  |  |  | 		BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_nr), | 
					
						
							|  |  |  | 		/* Jump table for the allowed syscalls */ | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_rt_sigreturn, 0, 1), | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW), | 
					
						
							|  |  |  | #ifdef __NR_sigreturn
 | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_sigreturn, 0, 1), | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW), | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_exit_group, 0, 1), | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW), | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_exit, 0, 1), | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW), | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_read, 1, 0), | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_write, 3, 2), | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* Check that read is only using stdin. */ | 
					
						
							|  |  |  | 		BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_arg(0)), | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDIN_FILENO, 4, 0), | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_KILL), | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* Check that write is only using stdout */ | 
					
						
							|  |  |  | 		BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_arg(0)), | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDOUT_FILENO, 1, 0), | 
					
						
							|  |  |  | 		/* Trap attempts to write to stderr */ | 
					
						
							|  |  |  | 		BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDERR_FILENO, 1, 2), | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW), | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_TRAP), | 
					
						
							|  |  |  | 		BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_KILL), | 
					
						
							|  |  |  | 	}; | 
					
						
							|  |  |  | 	struct sock_fprog prog = { | 
					
						
							|  |  |  | 		.len = (unsigned short)(sizeof(filter)/sizeof(filter[0])), | 
					
						
							|  |  |  | 		.filter = filter, | 
					
						
							|  |  |  | 	}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (prctl(PR_SET_NO_NEW_PRIVS, 1, 0, 0, 0)) { | 
					
						
							|  |  |  | 		perror("prctl(NO_NEW_PRIVS)"); | 
					
						
							|  |  |  | 		return 1; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (prctl(PR_SET_SECCOMP, SECCOMP_MODE_FILTER, &prog)) { | 
					
						
							|  |  |  | 		perror("prctl"); | 
					
						
							|  |  |  | 		return 1; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 	return 0; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #define payload(_c) (_c), sizeof((_c))
 | 
					
						
							|  |  |  | int main(int argc, char **argv) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	char buf[4096]; | 
					
						
							|  |  |  | 	ssize_t bytes = 0; | 
					
						
							|  |  |  | 	if (install_emulator()) | 
					
						
							|  |  |  | 		return 1; | 
					
						
							|  |  |  | 	if (install_filter()) | 
					
						
							|  |  |  | 		return 1; | 
					
						
							|  |  |  | 	syscall(__NR_write, STDOUT_FILENO, | 
					
						
							|  |  |  | 		payload("OHAI! WHAT IS YOUR NAME? ")); | 
					
						
							|  |  |  | 	bytes = syscall(__NR_read, STDIN_FILENO, buf, sizeof(buf)); | 
					
						
							|  |  |  | 	syscall(__NR_write, STDOUT_FILENO, payload("HELLO, ")); | 
					
						
							|  |  |  | 	syscall(__NR_write, STDOUT_FILENO, buf, bytes); | 
					
						
							|  |  |  | 	syscall(__NR_write, STDERR_FILENO, | 
					
						
							|  |  |  | 		payload("Error message going to STDERR\n")); | 
					
						
							|  |  |  | 	return 0; | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2012-04-18 19:50:25 -05:00
										 |  |  | #else	/* SUPPORTED_ARCH */
 | 
					
						
							|  |  |  | /*
 | 
					
						
							|  |  |  |  * This sample is x86-only.  Since kernel samples are compiled with the | 
					
						
							|  |  |  |  * host toolchain, a non-x86 host will result in using only the main() | 
					
						
							|  |  |  |  * below. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | int main(void) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return 1; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | #endif	/* SUPPORTED_ARCH */
 |