root/usr.sbin/bsdinstall/runconsoles/child.c
/*-
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright (c) 2022 Jessica Clarke <jrtc27@FreeBSD.org>
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <sys/param.h>
#include <sys/errno.h>
#include <sys/procctl.h>
#include <sys/queue.h>
#include <sys/resource.h>
#include <sys/sysctl.h>
#include <sys/wait.h>

#include <err.h>
#include <errno.h>
#include <fcntl.h>
#include <signal.h>
#include <stdarg.h>
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sysexits.h>
#include <termios.h>
#include <ttyent.h>
#include <unistd.h>

#include "common.h"
#include "child.h"

/* -1: not started, 0: reaped */
static volatile pid_t grandchild_pid = -1;
static volatile int grandchild_status;

static struct pipe_barrier wait_grandchild_barrier;
static struct pipe_barrier wait_all_descendants_barrier;

static void
kill_descendants(int sig)
{
        struct procctl_reaper_kill rk;

        rk.rk_sig = sig;
        rk.rk_flags = 0;
        procctl(P_PID, getpid(), PROC_REAP_KILL, &rk);
}

static void
sigalrm_handler(int sig __unused)
{
        int saved_errno;

        saved_errno = errno;
        kill_descendants(SIGKILL);
        errno = saved_errno;
}

static void
wait_all_descendants(void)
{
        sigset_t set, oset;

        err_set_exit(NULL);

        /*
         * We may be run in a context where SIGALRM is blocked; temporarily
         * unblock so we can SIGKILL. Similarly, SIGCHLD may be blocked, but if
         * we're waiting on the pipe we need to make sure it's not.
         */
        sigemptyset(&set);
        sigaddset(&set, SIGALRM);
        sigaddset(&set, SIGCHLD);
        sigprocmask(SIG_UNBLOCK, &set, &oset);
        alarm(KILL_TIMEOUT);
        pipe_barrier_wait(&wait_all_descendants_barrier);
        alarm(0);
        sigprocmask(SIG_SETMASK, &oset, NULL);
}

static void
sigchld_handler(int sig __unused)
{
        int status, saved_errno;
        pid_t pid;

        saved_errno = errno;

        while ((void)(pid = waitpid(-1, &status, WNOHANG)),
            pid != -1 && pid != 0) {
                /* NB: No need to check grandchild_pid due to the pid checks */
                if (pid == grandchild_pid) {
                        grandchild_status = status;
                        grandchild_pid = 0;
                        pipe_barrier_ready(&wait_grandchild_barrier);
                }
        }

        /*
         * Another process calling kill(..., SIGCHLD) could cause us to get
         * here before we've spawned the grandchild; only ready when we have no
         * children if the grandchild has been reaped.
         */
        if (pid == -1 && errno == ECHILD && grandchild_pid == 0)
                pipe_barrier_ready(&wait_all_descendants_barrier);

        errno = saved_errno;
}

static void
exit_signal_handler(int sig)
{
        int saved_errno;

        /*
         * If we get killed before we've started the grandchild then just exit
         * with that signal, otherwise kill all our descendants with that
         * signal and let the main program pick up the grandchild's death.
         */
        if (grandchild_pid == -1) {
                reproduce_signal_death(sig);
                exit(EXIT_FAILURE);
        }

        saved_errno = errno;
        kill_descendants(sig);
        errno = saved_errno;
}

static void
kill_wait_all_descendants(int sig)
{
        kill_descendants(sig);
        wait_all_descendants();
}

static void
kill_wait_all_descendants_err_exit(int eval __unused)
{
        kill_wait_all_descendants(SIGTERM);
}

static void __dead2
grandchild_run(const char **argv, const sigset_t *oset)
{
        sig_t orig;

        /* Restore signals */
        orig = signal(SIGALRM, SIG_DFL);
        if (orig == SIG_ERR)
                err(EX_OSERR, "could not restore SIGALRM");
        orig = signal(SIGCHLD, SIG_DFL);
        if (orig == SIG_ERR)
                err(EX_OSERR, "could not restore SIGCHLD");
        orig = signal(SIGTERM, SIG_DFL);
        if (orig == SIG_ERR)
                err(EX_OSERR, "could not restore SIGTERM");
        orig = signal(SIGINT, SIG_DFL);
        if (orig == SIG_ERR)
                err(EX_OSERR, "could not restore SIGINT");
        orig = signal(SIGQUIT, SIG_DFL);
        if (orig == SIG_ERR)
                err(EX_OSERR, "could not restore SIGQUIT");
        orig = signal(SIGPIPE, SIG_DFL);
        if (orig == SIG_ERR)
                err(EX_OSERR, "could not restore SIGPIPE");
        orig = signal(SIGTTOU, SIG_DFL);
        if (orig == SIG_ERR)
                err(EX_OSERR, "could not restore SIGTTOU");

        /* Now safe to unmask signals */
        sigprocmask(SIG_SETMASK, oset, NULL);

        /* Only run with stdin/stdout/stderr */
        closefrom(3);

        /* Ready to execute the requested program */
        execvp(argv[0], __DECONST(char * const *, argv));
        err(EX_OSERR, "cannot execvp %s", argv[0]);
}

static int
wait_grandchild_descendants(void)
{
        pipe_barrier_wait(&wait_grandchild_barrier);

        /*
         * Once the grandchild itself has exited, kill any lingering
         * descendants and wait until we've reaped them all.
         */
        kill_wait_all_descendants(SIGTERM);

        if (grandchild_pid != 0)
                errx(EX_SOFTWARE, "failed to reap grandchild");

        return (grandchild_status);
}

void
child_leader_run(const char *name, int fd, bool new_session, const char **argv,
    const sigset_t *oset, struct pipe_barrier *start_children_barrier)
{
        struct pipe_barrier start_grandchild_barrier;
        pid_t pid, sid, pgid;
        struct sigaction sa;
        int error, status;
        sigset_t set;

        setproctitle("%s [%s]", getprogname(), name);

        error = procctl(P_PID, getpid(), PROC_REAP_ACQUIRE, NULL);
        if (error != 0)
                err(EX_OSERR, "could not acquire reaper status");

        /*
         * Set up our own signal handlers for everything the parent overrides
         * other than SIGPIPE and SIGTTOU which we leave as ignored, since we
         * also use pipe-based synchronisation and want to be able to print
         * errors.
         */
        sa.sa_flags = SA_RESTART;
        sa.sa_handler = sigchld_handler;
        sigfillset(&sa.sa_mask);
        error = sigaction(SIGCHLD, &sa, NULL);
        if (error != 0)
                err(EX_OSERR, "could not enable SIGCHLD handler");
        sa.sa_handler = sigalrm_handler;
        error = sigaction(SIGALRM, &sa, NULL);
        if (error != 0)
                err(EX_OSERR, "could not enable SIGALRM handler");
        sa.sa_handler = exit_signal_handler;
        error = sigaction(SIGTERM, &sa, NULL);
        if (error != 0)
                err(EX_OSERR, "could not enable SIGTERM handler");
        error = sigaction(SIGINT, &sa, NULL);
        if (error != 0)
                err(EX_OSERR, "could not enable SIGINT handler");
        error = sigaction(SIGQUIT, &sa, NULL);
        if (error != 0)
                err(EX_OSERR, "could not enable SIGQUIT handler");

        /*
         * Now safe to unmask signals. Note that creating the barriers used by
         * the SIGCHLD handler with signals unmasked is safe since they won't
         * be used if the grandchild hasn't been forked (and reaped), which
         * comes later.
         */
        sigprocmask(SIG_SETMASK, oset, NULL);

        error = pipe_barrier_init(&start_grandchild_barrier);
        if (error != 0)
                err(EX_OSERR, "could not create start grandchild barrier");

        error = pipe_barrier_init(&wait_grandchild_barrier);
        if (error != 0)
                err(EX_OSERR, "could not create wait grandchild barrier");

        error = pipe_barrier_init(&wait_all_descendants_barrier);
        if (error != 0)
                err(EX_OSERR, "could not create wait all descendants barrier");

        /*
         * Create a new session if this is on a different terminal to
         * the current one, otherwise just create a new process group to keep
         * things as similar as possible between the two cases.
         */
        if (new_session) {
                sid = setsid();
                pgid = sid;
                if (sid == -1)
                        err(EX_OSERR, "could not create session");
        } else {
                sid = -1;
                pgid = getpid();
                error = setpgid(0, pgid);
                if (error == -1)
                        err(EX_OSERR, "could not create process group");
        }

        /* Wait until parent is ready for us to start */
        pipe_barrier_destroy_ready(start_children_barrier);
        pipe_barrier_wait(start_children_barrier);

        /*
         * Use the console for stdin/stdout/stderr.
         *
         * NB: dup2(2) is a no-op if the two fds are equal, and the call to
         * closefrom(2) later in the grandchild will close the fd if it isn't
         * one of stdin/stdout/stderr already. This means we do not need to
         * handle that special case differently.
         */
        error = dup2(fd, STDIN_FILENO);
        if (error == -1)
                err(EX_IOERR, "could not dup %s to stdin", name);
        error = dup2(fd, STDOUT_FILENO);
        if (error == -1)
                err(EX_IOERR, "could not dup %s to stdout", name);
        error = dup2(fd, STDERR_FILENO);
        if (error == -1)
                err(EX_IOERR, "could not dup %s to stderr", name);

        /*
         * If we created a new session, make the console our controlling
         * terminal. Either way, also make this the foreground process group.
         */
        if (new_session) {
                error = tcsetsid(STDIN_FILENO, sid);
                if (error != 0)
                        err(EX_IOERR, "could not set session for %s", name);
        } else {
                error = tcsetpgrp(STDIN_FILENO, pgid);
                if (error != 0)
                        err(EX_IOERR, "could not set process group for %s",
                            name);
        }

        /*
         * Temporarily block signals again; forking, setting grandchild_pid and
         * calling err_set_exit need to all be atomic for similar reasons as
         * the parent when forking us.
         */
        sigfillset(&set);
        sigprocmask(SIG_BLOCK, &set, NULL);
        pid = fork();
        if (pid == -1)
                err(EX_OSERR, "could not fork");

        if (pid == 0) {
                /*
                 * We need to destroy the ready ends so we don't block these
                 * child leader-only self-pipes, and might as well destroy the
                 * wait ends too given we're not going to use them.
                 */
                pipe_barrier_destroy(&wait_grandchild_barrier);
                pipe_barrier_destroy(&wait_all_descendants_barrier);

                /* Wait until the parent has put us in a new process group */
                pipe_barrier_destroy_ready(&start_grandchild_barrier);
                pipe_barrier_wait(&start_grandchild_barrier);
                grandchild_run(argv, oset);
        }

        grandchild_pid = pid;

        /*
         * Now the grandchild exists make sure to clean it up, and any of its
         * descendants, on exit.
         */
        err_set_exit(kill_wait_all_descendants_err_exit);

        sigprocmask(SIG_SETMASK, oset, NULL);

        /* Start the grandchild and wait for it and its descendants to exit */
        pipe_barrier_ready(&start_grandchild_barrier);

        status = wait_grandchild_descendants();

        if (WIFSIGNALED(status))
                reproduce_signal_death(WTERMSIG(status));

        if (WIFEXITED(status))
                exit(WEXITSTATUS(status));

        exit(EXIT_FAILURE);
}