root/tools/testing/selftests/mount/unprivileged-remount-test.c
// SPDX-License-Identifier: GPL-2.0
#define _GNU_SOURCE
#include <sched.h>
#include <stdio.h>
#include <errno.h>
#include <string.h>
#include <sys/types.h>
#include <sys/mount.h>
#include <sys/wait.h>
#include <sys/vfs.h>
#include <sys/statvfs.h>
#include <stdlib.h>
#include <unistd.h>
#include <fcntl.h>
#include <grp.h>
#include <stdbool.h>
#include <stdarg.h>

/*
 * Fallback values for the namespace clone flags, used only when the
 * headers included above did not already define them. The code visible
 * in this file passes CLONE_NEWUSER and CLONE_NEWNS to unshare().
 */
#ifndef CLONE_NEWNS
# define CLONE_NEWNS 0x00020000
#endif
#ifndef CLONE_NEWUTS
# define CLONE_NEWUTS 0x04000000
#endif
#ifndef CLONE_NEWIPC
# define CLONE_NEWIPC 0x08000000
#endif
#ifndef CLONE_NEWNET
# define CLONE_NEWNET 0x40000000
#endif
#ifndef CLONE_NEWUSER
# define CLONE_NEWUSER 0x10000000
#endif
#ifndef CLONE_NEWPID
# define CLONE_NEWPID 0x20000000
#endif

/*
 * Fallback values for mount flags, used only when the headers included
 * above did not already define them.
 */
#ifndef MS_REC
# define MS_REC 16384
#endif
#ifndef MS_RELATIME
# define MS_RELATIME (1 << 21)
#endif
#ifndef MS_STRICTATIME
# define MS_STRICTATIME (1 << 24)
#endif

/*
 * Report a fatal error and terminate.
 *
 * Formats the printf-style message onto stderr, then ends the process
 * with EXIT_FAILURE. This function does not return.
 */
static void die(char *fmt, ...)
{
        va_list args;

        va_start(args, fmt);
        vfprintf(stderr, fmt, args);
        va_end(args);

        exit(EXIT_FAILURE);
}

/*
 * Format a message and store it in an already existing file.
 *
 * enoent_ok: when true, a file that does not exist (ENOENT on open) is
 *            silently skipped; when false it is fatal like any other error.
 * filename:  file to open write-only; it is never created here.
 * fmt, ap:   printf-style format and its arguments.
 *
 * The formatted text must fit the 4096-byte local buffer and must be
 * accepted by a single write() call. Any formatting, open, write or
 * close failure terminates the process through die().
 */
static void vmaybe_write_file(bool enoent_ok, char *filename, char *fmt, va_list ap)
{
        char text[4096];
        ssize_t nwritten;
        int len;
        int fd;

        len = vsnprintf(text, sizeof(text), fmt, ap);
        if (len < 0) {
                die("vsnprintf failed: %s\n", strerror(errno));
        }
        /* len is non-negative here, so the cast cannot change its value. */
        if ((size_t)len >= sizeof(text)) {
                die("vsnprintf output truncated\n");
        }

        fd = open(filename, O_WRONLY);
        if (fd < 0) {
                /* A missing file is tolerated only if the caller said so. */
                if (enoent_ok && (errno == ENOENT)) {
                        return;
                }
                die("open of %s failed: %s\n", filename, strerror(errno));
        }

        nwritten = write(fd, text, len);
        if (nwritten < 0) {
                die("write to %s failed: %s\n", filename, strerror(errno));
        }
        if (nwritten != len) {
                /* Partial writes are not retried; they count as failure. */
                die("short write to %s\n", filename);
        }

        if (close(fd) != 0) {
                die("close of %s failed: %s\n", filename, strerror(errno));
        }
}

/*
 * Write a printf-style formatted message to filename, doing nothing if
 * the file does not exist. Every other failure is fatal (see
 * vmaybe_write_file()).
 */
static void maybe_write_file(char *filename, char *fmt, ...)
{
        va_list args;

        va_start(args, fmt);
        vmaybe_write_file(true, filename, fmt, args);
        va_end(args);
}

/*
 * Write a printf-style formatted message to filename. The file must
 * already exist; any failure, including a missing file, is fatal (see
 * vmaybe_write_file()).
 */
static void write_file(char *filename, char *fmt, ...)
{
        va_list args;

        va_start(args, fmt);
        vmaybe_write_file(false, filename, fmt, args);
        va_end(args);
}

/*
 * Read the mount flags of the filesystem that contains path.
 *
 * The ST_* bits reported by statvfs() are translated into the matching
 * MS_* mount flags, so the result can be handed back to mount().
 *
 * Returns the MS_* flag set. Dies if statvfs() fails or if it reports a
 * bit that has no entry in the translation table below.
 */
static int read_mnt_flags(const char *path)
{
        /*
         * One row per recognised flag: statvfs() bit -> mount() bit.
         * Keeping both names side by side prevents an ST_* constant from
         * leaking into the MS_* result.
         */
        static const struct {
                unsigned long st_flag;
                int ms_flag;
        } flag_map[] = {
                { ST_RDONLY,      MS_RDONLY },
                { ST_NOSUID,      MS_NOSUID },
                { ST_NODEV,       MS_NODEV },
                { ST_NOEXEC,      MS_NOEXEC },
                { ST_NOATIME,     MS_NOATIME },
                { ST_NODIRATIME,  MS_NODIRATIME },
                { ST_RELATIME,    MS_RELATIME },
                { ST_SYNCHRONOUS, MS_SYNCHRONOUS },
                { ST_MANDLOCK,    MS_MANDLOCK },
        };
        const size_t nr_flags = sizeof(flag_map) / sizeof(flag_map[0]);
        struct statvfs vfs;
        unsigned long remaining;
        int mnt_flags = 0;
        size_t i;

        if (statvfs(path, &vfs) != 0) {
                die("statvfs of %s failed: %s\n",
                        path, strerror(errno));
        }

        /* Translate every known bit and strike it off the remainder. */
        remaining = vfs.f_flag;
        for (i = 0; i < nr_flags; i++) {
                if (remaining & flag_map[i].st_flag) {
                        mnt_flags |= flag_map[i].ms_flag;
                        remaining &= ~flag_map[i].st_flag;
                }
        }

        /* Anything still set is a flag this test cannot translate. */
        if (remaining != 0) {
                die("Unrecognized mount flags\n");
        }

        return mnt_flags;
}

/*
 * Move the calling process into a new user namespace in which it runs
 * as uid 0 / gid 0.
 *
 * The caller's current uid and gid are sampled before unshare() and
 * become the outside half of single-entry id maps ("0 <id> 1"). Any
 * failure terminates the process through die().
 */
static void create_and_enter_userns(void)
{
        uid_t uid = getuid();
        gid_t gid = getgid();

        if (unshare(CLONE_NEWUSER) != 0) {
                die("unshare(CLONE_NEWUSER) failed: %s\n",
                        strerror(errno));
        }

        /* /proc/self/setgroups may be absent; that case is tolerated. */
        maybe_write_file("/proc/self/setgroups", "deny");

        /*
         * uid_t and gid_t are unsigned: print them with %u so that ids
         * above INT_MAX are not written out as negative numbers.
         */
        write_file("/proc/self/uid_map", "0 %u 1", (unsigned int)uid);
        write_file("/proc/self/gid_map", "0 %u 1", (unsigned int)gid);

        if (setgid(0) != 0) {
                die("setgid(0) failed %s\n",
                        strerror(errno));
        }
        if (setuid(0) != 0) {
                die("setuid(0) failed %s\n",
                        strerror(errno));
        }
}

/*
 * Run one remount scenario in a forked child and report how it went.
 *
 * The child:
 *   1. enters a new user namespace and a new mount namespace,
 *   2. mounts a fresh fstype instance (source "testing") on /tmp with
 *      mount_flags and mount_options,
 *   3. enters a second, nested user namespace and mount namespace,
 *   4. bind-remounts /tmp with remount_flags, which has to succeed,
 *   5. bind-remounts /tmp with invalid_flags, which has to fail.
 *
 * Returns true when the child exited with EXIT_SUCCESS, false when it
 * exited with any other status. Failures in the parent itself (fork,
 * waitpid, abnormal child termination) end the whole process via die().
 */
static
bool test_unpriv_remount(const char *fstype, const char *mount_options,
                         int mount_flags, int remount_flags, int invalid_flags)
{
        pid_t child = fork();

        if (child == -1) {
                die("fork failed: %s\n", strerror(errno));
        }

        if (child != 0) {
                /* Parent: reap the child and turn its status into a bool. */
                int wstatus;
                pid_t reaped = waitpid(child, &wstatus, 0);

                if (reaped == -1) {
                        die("waitpid failed: %s\n", strerror(errno));
                }
                if (reaped != child) {
                        die("waited for %d got %d\n", child, reaped);
                }
                if (!WIFEXITED(wstatus)) {
                        die("child did not terminate cleanly\n");
                }
                return WEXITSTATUS(wstatus) == EXIT_SUCCESS;
        }

        /* Child: first namespace level, where the filesystem is mounted. */
        create_and_enter_userns();
        if (unshare(CLONE_NEWNS) != 0) {
                die("unshare(CLONE_NEWNS) failed: %s\n", strerror(errno));
        }

        if (mount("testing", "/tmp", fstype, mount_flags, mount_options) != 0) {
                const char *shown_options = mount_options ? mount_options : "";

                die("mount of %s with options '%s' on /tmp failed: %s\n",
                    fstype, shown_options, strerror(errno));
        }

        /* Second, nested namespace level, where the remounts are tried. */
        create_and_enter_userns();
        if (unshare(CLONE_NEWNS) != 0) {
                die("unshare(CLONE_NEWNS) failed: %s\n", strerror(errno));
        }

        /* This remount is expected to be accepted. */
        if (mount("/tmp", "/tmp", "none",
                  MS_REMOUNT | MS_BIND | remount_flags, NULL) != 0) {
                die("remount of /tmp failed: %s\n", strerror(errno));
        }

        /* This remount is expected to be refused. */
        if (mount("/tmp", "/tmp", "none",
                  MS_REMOUNT | MS_BIND | invalid_flags, NULL) == 0) {
                die("remount of /tmp with invalid flags "
                    "succeeded unexpectedly\n");
        }

        exit(EXIT_SUCCESS);
}

/*
 * Run test_unpriv_remount() on a ramfs mount, using mount_flags both for
 * the initial mount and for the remount that must succeed, and no extra
 * flags at all for the remount that must fail.
 */
static bool test_unpriv_remount_simple(int mount_flags)
{
        const int no_extra_flags = 0;

        return test_unpriv_remount("ramfs", NULL, mount_flags, mount_flags,
                                   no_extra_flags);
}

/*
 * Run test_unpriv_remount() on a ramfs mount, using mount_flags both for
 * the initial mount and for the remount that must succeed, and
 * invalid_flags for the remount that must fail.
 */
static bool test_unpriv_remount_atime(int mount_flags, int invalid_flags)
{
        const int remount_flags = mount_flags;

        return test_unpriv_remount("ramfs", NULL, mount_flags, remount_flags,
                                   invalid_flags);
}

/*
 * Check that remounting a bind mount of an existing mount with its own
 * flags leaves those flags unchanged.
 *
 * A forked child records the mount flags of /dev, enters a new user
 * namespace and mount namespace, recursively bind-mounts /dev onto /tmp,
 * bind-remounts /tmp with the recorded flags and then compares the flags
 * read back from /tmp with the recorded ones.
 *
 * Returns true when the child exited with EXIT_SUCCESS, false when it
 * exited with any other status. Failures in the parent itself (fork,
 * waitpid, abnormal child termination) end the whole process via die().
 */
static bool test_priv_mount_unpriv_remount(void)
{
        const char *orig_path = "/dev";
        const char *dest_path = "/tmp";
        int flags_before, flags_after;
        pid_t child = fork();

        if (child == -1) {
                die("fork failed: %s\n", strerror(errno));
        }

        if (child != 0) {
                /* Parent: reap the child and turn its status into a bool. */
                int wstatus;
                pid_t reaped = waitpid(child, &wstatus, 0);

                if (reaped == -1) {
                        die("waitpid failed: %s\n", strerror(errno));
                }
                if (reaped != child) {
                        die("waited for %d got %d\n", child, reaped);
                }
                if (!WIFEXITED(wstatus)) {
                        die("child did not terminate cleanly\n");
                }
                return WEXITSTATUS(wstatus) == EXIT_SUCCESS;
        }

        /* Child: sample the flags before any namespace is changed. */
        flags_before = read_mnt_flags(orig_path);

        create_and_enter_userns();
        if (unshare(CLONE_NEWNS) != 0) {
                die("unshare(CLONE_NEWNS) failed: %s\n", strerror(errno));
        }

        if (mount(orig_path, dest_path, "bind", MS_BIND | MS_REC, NULL) != 0) {
                die("recursive bind mount of %s onto %s failed: %s\n",
                    orig_path, dest_path, strerror(errno));
        }

        if (mount(dest_path, dest_path, "none",
                  MS_REMOUNT | MS_BIND | flags_before, NULL) != 0) {
                die("remount of /tmp failed: %s\n", strerror(errno));
        }

        flags_after = read_mnt_flags(dest_path);
        if (flags_after != flags_before) {
                die("Mount flags unexpectedly changed during remount of %s originally mounted on %s\n",
                    dest_path, orig_path);
        }

        exit(EXIT_SUCCESS);
}

/*
 * Run every remount scenario in turn and stop at the first failure.
 *
 * Each scenario runs in its own forked child (see test_unpriv_remount()
 * and test_priv_mount_unpriv_remount()). When one reports failure, a
 * message naming the flags under test is printed and the process exits
 * with EXIT_FAILURE; otherwise EXIT_SUCCESS is returned.
 */
int main(int argc, char **argv)
{
        /* No command-line arguments are interpreted. */
        (void)argc;
        (void)argv;

        /* Single flags that must survive, and be required by, the remount. */
        if (!test_unpriv_remount_simple(MS_RDONLY)) {
                die("MS_RDONLY malfunctions\n");
        }
        if (!test_unpriv_remount("devpts", "newinstance", MS_NODEV, MS_NODEV, 0)) {
                die("MS_NODEV malfunctions\n");
        }
        if (!test_unpriv_remount_simple(MS_NOSUID)) {
                die("MS_NOSUID malfunctions\n");
        }
        if (!test_unpriv_remount_simple(MS_NOEXEC)) {
                die("MS_NOEXEC malfunctions\n");
        }

        /* atime modes: the second argument is a mode that must be refused. */
        if (!test_unpriv_remount_atime(MS_RELATIME,
                                       MS_NOATIME)) {
                die("MS_RELATIME malfunctions\n");
        }
        if (!test_unpriv_remount_atime(MS_STRICTATIME,
                                       MS_NOATIME)) {
                die("MS_STRICTATIME malfunctions\n");
        }
        if (!test_unpriv_remount_atime(MS_NOATIME,
                                       MS_STRICTATIME)) {
                die("MS_NOATIME malfunctions\n");
        }
        if (!test_unpriv_remount_atime(MS_RELATIME|MS_NODIRATIME,
                                       MS_NOATIME)) {
                die("MS_RELATIME|MS_NODIRATIME malfunctions\n");
        }
        if (!test_unpriv_remount_atime(MS_STRICTATIME|MS_NODIRATIME,
                                       MS_NOATIME)) {
                die("MS_STRICTATIME|MS_NODIRATIME malfunctions\n");
        }
        if (!test_unpriv_remount_atime(MS_NOATIME|MS_NODIRATIME,
                                       MS_STRICTATIME)) {
                /* The message names the flags actually passed above. */
                die("MS_NOATIME|MS_NODIRATIME malfunctions\n");
        }

        /* Remount without naming any atime mode must still succeed. */
        if (!test_unpriv_remount("ramfs", NULL, MS_STRICTATIME, 0, MS_NOATIME)) {
                die("Default atime malfunctions\n");
        }

        if (!test_priv_mount_unpriv_remount()) {
                die("Mount flags unexpectedly changed after remount\n");
        }
        return EXIT_SUCCESS;
}