| // SPDX-License-Identifier: GPL-2.0 |
| #define _GNU_SOURCE |
| #include <stdio.h> |
| #include <errno.h> |
| #include <pwd.h> |
| #include <grp.h> |
| #include <string.h> |
| #include <syscall.h> |
| #include <sys/capability.h> |
| #include <sys/types.h> |
| #include <sys/mount.h> |
| #include <sys/prctl.h> |
| #include <sys/wait.h> |
| #include <stdlib.h> |
| #include <unistd.h> |
| #include <fcntl.h> |
| #include <stdbool.h> |
| #include <stdarg.h> |
| |
/*
 * NOTES about this test:
 * - requires libcap-dev to be installed on the test system
 * - requires securityfs to be mounted at /sys/kernel/security, e.g.:
 *   mount -n -t securityfs -o nodev,noexec,nosuid securityfs /sys/kernel/security
 * - needs CONFIG_SECURITYFS and CONFIG_SAFESETID to be enabled
 */
| |
/* Fallback for libc headers that do not provide CLONE_NEWUSER. */
#if !defined(CLONE_NEWUSER)
# define CLONE_NEWUSER 0x10000000
#endif

/*
 * Numeric IDs used throughout the test.  Each value is used both as a UID
 * and as a GID.
 */
enum {
	ROOT_UGID		= 0,
	RESTRICTED_PARENT_UGID	= 1,	/* left-hand side of "1:2" and "1:3" below */
	ALLOWED_CHILD1_UGID	= 2,	/* right-hand side of "1:2" below */
	ALLOWED_CHILD2_UGID	= 3,	/* right-hand side of "1:3" below */
	NO_POLICY_UGID		= 4,	/* does not appear in the policy string */
};

/*
 * Policy text written verbatim to both the UID and the GID policy file:
 * one "<id>:<id>" pair per line.
 */
#define UGID_POLICY_STRING "1:2\n1:3\n2:2\n3:3\n"
| |
/*
 * Paths of the SafeSetID policy files under securityfs.  They are only
 * read in this file, so they are immutable pointers to immutable strings
 * with internal linkage.
 */
static const char *const add_uid_whitelist_policy_file =
	"/sys/kernel/security/safesetid/uid_allowlist_policy";
static const char *const add_gid_whitelist_policy_file =
	"/sys/kernel/security/safesetid/gid_allowlist_policy";
| |
/*
 * Print a printf-style message to stderr and terminate the process with
 * EXIT_FAILURE.  This function never returns.
 *
 * @fmt: printf-style format string; the remaining arguments are its
 *       parameters.  The format attribute lets the compiler check them.
 */
__attribute__((noreturn, format(printf, 1, 2)))
static void die(const char *fmt, ...)
{
	va_list ap;

	va_start(ap, fmt);
	vfprintf(stderr, fmt, ap);
	va_end(ap);
	exit(EXIT_FAILURE);
}
| |
/*
 * Format a message and write it to an already existing file with a single
 * write() call.
 *
 * @enoent_ok: when true, open() failing with ENOENT counts as success and
 *             nothing is written.
 * @filename:  path of the file, opened with O_WRONLY (it is not created).
 * @fmt, @ap:  printf-style format and arguments; the formatted text must
 *             fit in the 4096-byte local buffer.
 *
 * Returns true on success and false on any formatting, open, write or
 * close failure.  Formatting, write and close failures are reported on
 * stdout; an open() failure is not reported.
 */
static bool vmaybe_write_file(bool enoent_ok, const char *filename,
			      const char *fmt, va_list ap)
{
	char buf[4096];
	ssize_t written;
	int buf_len;
	int fd;

	buf_len = vsnprintf(buf, sizeof(buf), fmt, ap);
	if (buf_len < 0) {
		printf("vsnprintf failed: %s\n",
		       strerror(errno));
		return false;
	}
	/* buf_len is non-negative here, so the cast cannot wrap. */
	if ((size_t)buf_len >= sizeof(buf)) {
		printf("vsnprintf output truncated\n");
		return false;
	}

	fd = open(filename, O_WRONLY);
	if (fd < 0) {
		if ((errno == ENOENT) && enoent_ok)
			return true;
		return false;
	}

	written = write(fd, buf, buf_len);
	if (written != buf_len) {
		/* Report first: close() below may overwrite errno. */
		if (written >= 0)
			printf("short write to %s\n", filename);
		else
			printf("write to %s failed: %s\n",
			       filename, strerror(errno));
		/* Do not leak the descriptor on the failure path. */
		close(fd);
		return false;
	}

	if (close(fd) != 0) {
		printf("close of %s failed: %s\n",
		       filename, strerror(errno));
		return false;
	}
	return true;
}
| |
/*
 * Variadic front end to vmaybe_write_file(): formats the arguments
 * according to @fmt and writes the result to @filename.  A missing file is
 * not tolerated (enoent_ok is passed as false).
 *
 * Returns whatever vmaybe_write_file() returns.
 */
static bool write_file(char *filename, char *fmt, ...)
{
	va_list args;
	bool ok;

	va_start(args, fmt);
	ok = vmaybe_write_file(false, filename, fmt, args);
	va_end(args);
	return ok;
}
| |
/*
 * Make sure a passwd entry exists for @uid.
 *
 * When getpwuid() finds no entry, one is appended to /etc/passwd with the
 * name "user <uid>", a primary GID equal to @uid, the GECOS text
 * "Test account", home directory /dev/null and shell /bin/false.  Every
 * failure along the way ends the test through die().
 */
static void ensure_user_exists(uid_t uid)
{
	char name[10];
	FILE *passwd_file;

	if (getpwuid(uid) != NULL)
		return;

	passwd_file = fopen("/etc/passwd", "a");
	if (passwd_file == NULL)
		die("couldn't open file\n");
	if (fseek(passwd_file, 0, SEEK_END))
		die("couldn't fseek\n");

	snprintf(name, sizeof(name), "user %d", uid);

	/* Members not named below (such as pw_passwd) are zero-initialized. */
	struct passwd entry = {
		.pw_name = name,
		.pw_uid = uid,
		.pw_gid = uid,
		.pw_gecos = "Test account",
		.pw_dir = "/dev/null",
		.pw_shell = "/bin/false",
	};

	if (putpwent(&entry, passwd_file) != 0)
		die("putpwent failed\n");
	if (fclose(passwd_file))
		die("fclose failed\n");
}
| |
/*
 * Make sure a group entry exists for @gid.
 *
 * When getgrgid() finds no entry, one is appended to /etc/group with the
 * name "group <gid>", no password and no member list.  Every failure along
 * the way ends the test through die().
 */
static void ensure_group_exists(gid_t gid)
{
	char name[10];
	FILE *group_file;

	if (getgrgid(gid) != NULL)
		return;

	group_file = fopen("/etc/group", "a");
	if (group_file == NULL)
		die("couldn't open group file\n");
	if (fseek(group_file, 0, SEEK_END))
		die("couldn't fseek group file\n");

	snprintf(name, sizeof(name), "group %d", gid);

	struct group entry = {
		.gr_name = name,
		.gr_gid = gid,
		.gr_passwd = NULL,
		.gr_mem = NULL,
	};

	if (putgrent(&entry, group_file) != 0)
		die("putgrent failed\n");
	if (fclose(group_file))
		die("fclose failed\n");
}
| |
| static void ensure_securityfs_mounted(void) |
| { |
| int fd = open(add_uid_whitelist_policy_file, O_WRONLY); |
| if (fd < 0) { |
| if (errno == ENOENT) { |
| // Need to mount securityfs |
| if (mount("securityfs", "/sys/kernel/security", |
| "securityfs", 0, NULL) < 0) |
| die("mounting securityfs failed\n"); |
| } else { |
| die("couldn't find securityfs for unknown reason\n"); |
| } |
| } else { |
| if (close(fd) != 0) { |
| die("close of %s failed: %s\n", |
| add_uid_whitelist_policy_file, strerror(errno)); |
| } |
| } |
| } |
| |
| static void write_uid_policies() |
| { |
| static char *policy_str = UGID_POLICY_STRING; |
| ssize_t written; |
| int fd; |
| |
| fd = open(add_uid_whitelist_policy_file, O_WRONLY); |
| if (fd < 0) |
| die("can't open add_uid_whitelist_policy file\n"); |
| written = write(fd, policy_str, strlen(policy_str)); |
| if (written != strlen(policy_str)) { |
| if (written >= 0) { |
| die("short write to %s\n", add_uid_whitelist_policy_file); |
| } else { |
| die("write to %s failed: %s\n", |
| add_uid_whitelist_policy_file, strerror(errno)); |
| } |
| } |
| if (close(fd) != 0) { |
| die("close of %s failed: %s\n", |
| add_uid_whitelist_policy_file, strerror(errno)); |
| } |
| } |
| |
| static void write_gid_policies() |
| { |
| static char *policy_str = UGID_POLICY_STRING; |
| ssize_t written; |
| int fd; |
| |
| fd = open(add_gid_whitelist_policy_file, O_WRONLY); |
| if (fd < 0) |
| die("can't open add_gid_whitelist_policy file\n"); |
| written = write(fd, policy_str, strlen(policy_str)); |
| if (written != strlen(policy_str)) { |
| if (written >= 0) { |
| die("short write to %s\n", add_gid_whitelist_policy_file); |
| } else { |
| die("write to %s failed: %s\n", |
| add_gid_whitelist_policy_file, strerror(errno)); |
| } |
| } |
| if (close(fd) != 0) { |
| die("close of %s failed: %s\n", |
| add_gid_whitelist_policy_file, strerror(errno)); |
| } |
| } |
| |
| |
| static bool test_userns(bool expect_success) |
| { |
| uid_t uid; |
| char map_file_name[32]; |
| size_t sz = sizeof(map_file_name); |
| pid_t cpid; |
| bool success; |
| |
| uid = getuid(); |
| |
| int clone_flags = CLONE_NEWUSER; |
| cpid = syscall(SYS_clone, clone_flags, NULL); |
| if (cpid == -1) { |
| printf("clone failed"); |
| return false; |
| } |
| |
| if (cpid == 0) { /* Code executed by child */ |
| // Give parent 1 second to write map file |
| sleep(1); |
| exit(EXIT_SUCCESS); |
| } else { /* Code executed by parent */ |
| if(snprintf(map_file_name, sz, "/proc/%d/uid_map", cpid) < 0) { |
| printf("preparing file name string failed"); |
| return false; |
| } |
| success = write_file(map_file_name, "0 %d 1", uid); |
| return success == expect_success; |
| } |
| |
| printf("should not reach here"); |
| return false; |
| } |
| |
| static void test_setuid(uid_t child_uid, bool expect_success) |
| { |
| pid_t cpid, w; |
| int wstatus; |
| |
| cpid = fork(); |
| if (cpid == -1) { |
| die("fork\n"); |
| } |
| |
| if (cpid == 0) { /* Code executed by child */ |
| if (setuid(child_uid) < 0) |
| exit(EXIT_FAILURE); |
| if (getuid() == child_uid) |
| exit(EXIT_SUCCESS); |
| else |
| exit(EXIT_FAILURE); |
| } else { /* Code executed by parent */ |
| do { |
| w = waitpid(cpid, &wstatus, WUNTRACED | WCONTINUED); |
| if (w == -1) { |
| die("waitpid\n"); |
| } |
| |
| if (WIFEXITED(wstatus)) { |
| if (WEXITSTATUS(wstatus) == EXIT_SUCCESS) { |
| if (expect_success) { |
| return; |
| } else { |
| die("unexpected success\n"); |
| } |
| } else { |
| if (expect_success) { |
| die("unexpected failure\n"); |
| } else { |
| return; |
| } |
| } |
| } else if (WIFSIGNALED(wstatus)) { |
| if (WTERMSIG(wstatus) == 9) { |
| if (expect_success) |
| die("killed unexpectedly\n"); |
| else |
| return; |
| } else { |
| die("unexpected signal: %d\n", wstatus); |
| } |
| } else { |
| die("unexpected status: %d\n", wstatus); |
| } |
| } while (!WIFEXITED(wstatus) && !WIFSIGNALED(wstatus)); |
| } |
| |
| die("should not reach here\n"); |
| } |
| |
| static void test_setgid(gid_t child_gid, bool expect_success) |
| { |
| pid_t cpid, w; |
| int wstatus; |
| |
| cpid = fork(); |
| if (cpid == -1) { |
| die("fork\n"); |
| } |
| |
| if (cpid == 0) { /* Code executed by child */ |
| if (setgid(child_gid) < 0) |
| exit(EXIT_FAILURE); |
| if (getgid() == child_gid) |
| exit(EXIT_SUCCESS); |
| else |
| exit(EXIT_FAILURE); |
| } else { /* Code executed by parent */ |
| do { |
| w = waitpid(cpid, &wstatus, WUNTRACED | WCONTINUED); |
| if (w == -1) { |
| die("waitpid\n"); |
| } |
| |
| if (WIFEXITED(wstatus)) { |
| if (WEXITSTATUS(wstatus) == EXIT_SUCCESS) { |
| if (expect_success) { |
| return; |
| } else { |
| die("unexpected success\n"); |
| } |
| } else { |
| if (expect_success) { |
| die("unexpected failure\n"); |
| } else { |
| return; |
| } |
| } |
| } else if (WIFSIGNALED(wstatus)) { |
| if (WTERMSIG(wstatus) == 9) { |
| if (expect_success) |
| die("killed unexpectedly\n"); |
| else |
| return; |
| } else { |
| die("unexpected signal: %d\n", wstatus); |
| } |
| } else { |
| die("unexpected status: %d\n", wstatus); |
| } |
| } while (!WIFEXITED(wstatus) && !WIFSIGNALED(wstatus)); |
| } |
| |
| die("should not reach here\n"); |
| } |
| |
/*
 * Fork a child that calls setgroups() with @child_groups and check the
 * outcome.
 *
 * The child exits with EXIT_SUCCESS only when setgroups() succeeds,
 * getgroups() then reports exactly @len groups, and every entry of
 * @child_groups is found among them; otherwise it exits with EXIT_FAILURE.
 *
 * @child_groups:   supplementary group list the child tries to install.
 * @len:            number of entries in @child_groups.
 * @expect_success: whether the change is expected to work.
 *
 * Returns normally when the observed outcome matches @expect_success and
 * ends the test through die() otherwise.  A child terminated by signal 9
 * counts as a failed change; any other signal or wait status is fatal.
 */
static void test_setgroups(gid_t* child_groups, size_t len, bool expect_success)
{
	pid_t cpid;
	int wstatus;

	cpid = fork();
	if (cpid == -1)
		die("fork\n");

	if (cpid == 0) {	/* Code executed by child */
		/* Keep the array non-empty: a zero-length VLA is undefined. */
		gid_t groupset[len ? len : 1];
		size_t i, j;
		int count;

		/*
		 * Use _exit() rather than exit() so that stdio buffers
		 * inherited from the parent are not flushed a second time.
		 */
		if (setgroups(len, child_groups) != 0)
			_exit(EXIT_FAILURE);
		count = getgroups((int)len, groupset);
		if (count < 0 || (size_t)count != len)
			_exit(EXIT_FAILURE);

		/* Every requested group must be present in the resulting set. */
		for (i = 0; i < len; i++) {
			for (j = 0; j < len; j++) {
				if (child_groups[i] == groupset[j])
					break;
			}
			if (j == len)
				_exit(EXIT_FAILURE);
		}
		_exit(EXIT_SUCCESS);
	}

	/* Code executed by parent */
	if (waitpid(cpid, &wstatus, WUNTRACED | WCONTINUED) == -1)
		die("waitpid\n");

	if (WIFEXITED(wstatus)) {
		bool child_ok = WEXITSTATUS(wstatus) == EXIT_SUCCESS;

		if (child_ok && !expect_success)
			die("unexpected success\n");
		if (!child_ok && expect_success)
			die("unexpected failure\n");
		return;
	}

	if (WIFSIGNALED(wstatus)) {
		/*
		 * Signal 9 is SIGKILL on Linux.
		 * NOTE(review): presumably this is how the LSM stops a
		 * disallowed change - confirm.
		 */
		if (WTERMSIG(wstatus) != 9)
			die("unexpected signal: %d\n", WTERMSIG(wstatus));
		if (expect_success)
			die("killed unexpectedly\n");
		return;
	}

	/* Stopped or continued children are not expected here. */
	die("unexpected status: %d\n", wstatus);
}
| |
| |
| static void ensure_users_exist(void) |
| { |
| ensure_user_exists(ROOT_UGID); |
| ensure_user_exists(RESTRICTED_PARENT_UGID); |
| ensure_user_exists(ALLOWED_CHILD1_UGID); |
| ensure_user_exists(ALLOWED_CHILD2_UGID); |
| ensure_user_exists(NO_POLICY_UGID); |
| } |
| |
| static void ensure_groups_exist(void) |
| { |
| ensure_group_exists(ROOT_UGID); |
| ensure_group_exists(RESTRICTED_PARENT_UGID); |
| ensure_group_exists(ALLOWED_CHILD1_UGID); |
| ensure_group_exists(ALLOWED_CHILD2_UGID); |
| ensure_group_exists(NO_POLICY_UGID); |
| } |
| |
| static void drop_caps(bool setid_retained) |
| { |
| cap_value_t cap_values[] = {CAP_SETUID, CAP_SETGID}; |
| cap_t caps; |
| |
| caps = cap_get_proc(); |
| if (setid_retained) |
| cap_set_flag(caps, CAP_EFFECTIVE, 2, cap_values, CAP_SET); |
| else |
| cap_clear(caps); |
| cap_set_proc(caps); |
| cap_free(caps); |
| } |
| |
| int main(int argc, char **argv) |
| { |
| ensure_groups_exist(); |
| ensure_users_exist(); |
| ensure_securityfs_mounted(); |
| write_uid_policies(); |
| write_gid_policies(); |
| |
| if (prctl(PR_SET_KEEPCAPS, 1L)) |
| die("Error with set keepcaps\n"); |
| |
| // First test to make sure we can write userns mappings from a non-root |
| // user that doesn't have any restrictions (as long as it has |
| // CAP_SETUID); |
| if (setgid(NO_POLICY_UGID) < 0) |
| die("Error with set gid(%d)\n", NO_POLICY_UGID); |
| if (setuid(NO_POLICY_UGID) < 0) |
| die("Error with set uid(%d)\n", NO_POLICY_UGID); |
| // Take away all but setid caps |
| drop_caps(true); |
| // Need PR_SET_DUMPABLE flag set so we can write /proc/[pid]/uid_map |
| // from non-root parent process. |
| if (prctl(PR_SET_DUMPABLE, 1, 0, 0, 0)) |
| die("Error with set dumpable\n"); |
| if (!test_userns(true)) { |
| die("test_userns failed when it should work\n"); |
| } |
| |
| // Now switch to a user/group with restrictions |
| if (setgid(RESTRICTED_PARENT_UGID) < 0) |
| die("Error with set gid(%d)\n", RESTRICTED_PARENT_UGID); |
| if (setuid(RESTRICTED_PARENT_UGID) < 0) |
| die("Error with set uid(%d)\n", RESTRICTED_PARENT_UGID); |
| |
| test_setuid(ROOT_UGID, false); |
| test_setuid(ALLOWED_CHILD1_UGID, true); |
| test_setuid(ALLOWED_CHILD2_UGID, true); |
| test_setuid(NO_POLICY_UGID, false); |
| |
| test_setgid(ROOT_UGID, false); |
| test_setgid(ALLOWED_CHILD1_UGID, true); |
| test_setgid(ALLOWED_CHILD2_UGID, true); |
| test_setgid(NO_POLICY_UGID, false); |
| |
| gid_t allowed_supp_groups[2] = {ALLOWED_CHILD1_UGID, ALLOWED_CHILD2_UGID}; |
| gid_t disallowed_supp_groups[2] = {ROOT_UGID, NO_POLICY_UGID}; |
| test_setgroups(allowed_supp_groups, 2, true); |
| test_setgroups(disallowed_supp_groups, 2, false); |
| |
| if (!test_userns(false)) { |
| die("test_userns worked when it should fail\n"); |
| } |
| |
| // Now take away all caps |
| drop_caps(false); |
| test_setuid(2, false); |
| test_setuid(3, false); |
| test_setuid(4, false); |
| test_setgid(2, false); |
| test_setgid(3, false); |
| test_setgid(4, false); |
| |
| // NOTE: this test doesn't clean up users that were created in |
| // /etc/passwd or flush policies that were added to the LSM. |
| printf("test successful!\n"); |
| return EXIT_SUCCESS; |
| } |