root/samples/seccomp/bpf-direct.c
// SPDX-License-Identifier: GPL-2.0
/*
 * Seccomp filter example for x86 (32-bit and 64-bit) with BPF macros
 *
 * Copyright (c) 2012 The Chromium OS Authors <chromium-os-dev@chromium.org>
 * Author: Will Drewry <wad@chromium.org>
 *
 * The code may be used by anyone for any purpose,
 * and can serve as a starting point for developing
 * applications using prctl(PR_SET_SECCOMP, 2, ...).
 */
#if defined(__i386__) || defined(__x86_64__)
#define SUPPORTED_ARCH 1
#endif

#if defined(SUPPORTED_ARCH)
#define __USE_GNU 1
#define _GNU_SOURCE 1

#include <linux/types.h>
#include <linux/filter.h>
#include <linux/seccomp.h>
#include <linux/unistd.h>
#include <signal.h>
#include <stdio.h>
#include <stddef.h>
#include <string.h>
#include <sys/prctl.h>
#include <unistd.h>

#define syscall_arg(_n) (offsetof(struct seccomp_data, args[_n]))
#define syscall_nr (offsetof(struct seccomp_data, nr))

#if defined(__i386__)
#define REG_RESULT      REG_EAX
#define REG_SYSCALL     REG_EAX
#define REG_ARG0        REG_EBX
#define REG_ARG1        REG_ECX
#define REG_ARG2        REG_EDX
#define REG_ARG3        REG_ESI
#define REG_ARG4        REG_EDI
#define REG_ARG5        REG_EBP
#elif defined(__x86_64__)
#define REG_RESULT      REG_RAX
#define REG_SYSCALL     REG_RAX
#define REG_ARG0        REG_RDI
#define REG_ARG1        REG_RSI
#define REG_ARG2        REG_RDX
#define REG_ARG3        REG_R10
#define REG_ARG4        REG_R8
#define REG_ARG5        REG_R9
#endif

#ifndef PR_SET_NO_NEW_PRIVS
#define PR_SET_NO_NEW_PRIVS 38
#endif

#ifndef SYS_SECCOMP
#define SYS_SECCOMP 1
#endif

static void emulator(int nr, siginfo_t *info, void *void_context)
{
        ucontext_t *ctx = (ucontext_t *)(void_context);
        int syscall;
        char *buf;
        ssize_t bytes;
        size_t len;
        if (info->si_code != SYS_SECCOMP)
                return;
        if (!ctx)
                return;
        syscall = ctx->uc_mcontext.gregs[REG_SYSCALL];
        buf = (char *) ctx->uc_mcontext.gregs[REG_ARG1];
        len = (size_t) ctx->uc_mcontext.gregs[REG_ARG2];

        if (syscall != __NR_write)
                return;
        if (ctx->uc_mcontext.gregs[REG_ARG0] != STDERR_FILENO)
                return;
        /* Redirect stderr messages to stdout. Doesn't handle EINTR, etc */
        ctx->uc_mcontext.gregs[REG_RESULT] = -1;
        if (write(STDOUT_FILENO, "[ERR] ", 6) > 0) {
                bytes = write(STDOUT_FILENO, buf, len);
                ctx->uc_mcontext.gregs[REG_RESULT] = bytes;
        }
        return;
}

static int install_emulator(void)
{
        struct sigaction act;
        sigset_t mask;
        memset(&act, 0, sizeof(act));
        sigemptyset(&mask);
        sigaddset(&mask, SIGSYS);

        act.sa_sigaction = &emulator;
        act.sa_flags = SA_SIGINFO;
        if (sigaction(SIGSYS, &act, NULL) < 0) {
                perror("sigaction");
                return -1;
        }
        if (sigprocmask(SIG_UNBLOCK, &mask, NULL)) {
                perror("sigprocmask");
                return -1;
        }
        return 0;
}

static int install_filter(void)
{
        struct sock_filter filter[] = {
                /* Grab the system call number */
                BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_nr),
                /* Jump table for the allowed syscalls */
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_rt_sigreturn, 0, 1),
                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
#ifdef __NR_sigreturn
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_sigreturn, 0, 1),
                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
#endif
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_exit_group, 0, 1),
                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_exit, 0, 1),
                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_read, 1, 0),
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, __NR_write, 3, 2),

                /* Check that read is only using stdin. */
                BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_arg(0)),
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDIN_FILENO, 4, 0),
                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_KILL),

                /* Check that write is only using stdout */
                BPF_STMT(BPF_LD+BPF_W+BPF_ABS, syscall_arg(0)),
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDOUT_FILENO, 1, 0),
                /* Trap attempts to write to stderr */
                BPF_JUMP(BPF_JMP+BPF_JEQ+BPF_K, STDERR_FILENO, 1, 2),

                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_ALLOW),
                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_TRAP),
                BPF_STMT(BPF_RET+BPF_K, SECCOMP_RET_KILL),
        };
        struct sock_fprog prog = {
                .len = (unsigned short)(sizeof(filter)/sizeof(filter[0])),
                .filter = filter,
        };

        if (prctl(PR_SET_NO_NEW_PRIVS, 1, 0, 0, 0)) {
                perror("prctl(NO_NEW_PRIVS)");
                return 1;
        }


        if (prctl(PR_SET_SECCOMP, SECCOMP_MODE_FILTER, &prog)) {
                perror("prctl");
                return 1;
        }
        return 0;
}

#define payload(_c) (_c), sizeof((_c))
int main(int argc, char **argv)
{
        char buf[4096];
        ssize_t bytes = 0;
        if (install_emulator())
                return 1;
        if (install_filter())
                return 1;
        syscall(__NR_write, STDOUT_FILENO,
                payload("OHAI! WHAT IS YOUR NAME? "));
        bytes = syscall(__NR_read, STDIN_FILENO, buf, sizeof(buf));
        syscall(__NR_write, STDOUT_FILENO, payload("HELLO, "));
        syscall(__NR_write, STDOUT_FILENO, buf, bytes);
        syscall(__NR_write, STDERR_FILENO,
                payload("Error message going to STDERR\n"));
        return 0;
}
#else   /* SUPPORTED_ARCH */
/*
 * This sample is x86-only.  Since kernel samples are compiled with the
 * host toolchain, a non-x86 host will result in using only the main()
 * below.
 */
int main(void)
{
        return 1;
}
#endif  /* SUPPORTED_ARCH */