| // SPDX-License-Identifier: GPL-2.0 |
| |
| /* |
| * Based on Christian Brauner's clone3() example. |
| * These tests are assuming to be running in the host's |
| * PID namespace. |
| */ |
| |
| #define _GNU_SOURCE |
| #include <errno.h> |
| #include <linux/types.h> |
| #include <linux/sched.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <stdbool.h> |
| #include <sys/syscall.h> |
| #include <sys/types.h> |
| #include <sys/un.h> |
| #include <sys/wait.h> |
| #include <unistd.h> |
| #include <sched.h> |
| |
| #include "../kselftest.h" |
| #include "clone3_selftests.h" |
| |
| #ifndef MAX_PID_NS_LEVEL |
| #define MAX_PID_NS_LEVEL 32 |
| #endif |
| |
| static int pipe_1[2]; |
| static int pipe_2[2]; |
| |
| static void child_exit(int ret) |
| { |
| fflush(stdout); |
| fflush(stderr); |
| _exit(ret); |
| } |
| |
| static int call_clone3_set_tid(pid_t *set_tid, |
| size_t set_tid_size, |
| int flags, |
| int expected_pid, |
| bool wait_for_it) |
| { |
| int status; |
| pid_t pid = -1; |
| |
| struct __clone_args args = { |
| .flags = flags, |
| .exit_signal = SIGCHLD, |
| .set_tid = ptr_to_u64(set_tid), |
| .set_tid_size = set_tid_size, |
| }; |
| |
| pid = sys_clone3(&args, sizeof(args)); |
| if (pid < 0) { |
| ksft_print_msg("%s - Failed to create new process\n", |
| strerror(errno)); |
| return -errno; |
| } |
| |
| if (pid == 0) { |
| int ret; |
| char tmp = 0; |
| int exit_code = EXIT_SUCCESS; |
| |
| ksft_print_msg("I am the child, my PID is %d (expected %d)\n", |
| getpid(), set_tid[0]); |
| if (wait_for_it) { |
| ksft_print_msg("[%d] Child is ready and waiting\n", |
| getpid()); |
| |
| /* Signal the parent that the child is ready */ |
| close(pipe_1[0]); |
| ret = write(pipe_1[1], &tmp, 1); |
| if (ret != 1) { |
| ksft_print_msg( |
| "Writing to pipe returned %d", ret); |
| exit_code = EXIT_FAILURE; |
| } |
| close(pipe_1[1]); |
| close(pipe_2[1]); |
| ret = read(pipe_2[0], &tmp, 1); |
| if (ret != 1) { |
| ksft_print_msg( |
| "Reading from pipe returned %d", ret); |
| exit_code = EXIT_FAILURE; |
| } |
| close(pipe_2[0]); |
| } |
| |
| if (set_tid[0] != getpid()) |
| child_exit(EXIT_FAILURE); |
| child_exit(exit_code); |
| } |
| |
| if (expected_pid == 0 || expected_pid == pid) { |
| ksft_print_msg("I am the parent (%d). My child's pid is %d\n", |
| getpid(), pid); |
| } else { |
| ksft_print_msg( |
| "Expected child pid %d does not match actual pid %d\n", |
| expected_pid, pid); |
| return -1; |
| } |
| |
| if (waitpid(pid, &status, 0) < 0) { |
| ksft_print_msg("Child returned %s\n", strerror(errno)); |
| return -errno; |
| } |
| |
| if (!WIFEXITED(status)) |
| return -1; |
| |
| return WEXITSTATUS(status); |
| } |
| |
| static void test_clone3_set_tid(pid_t *set_tid, |
| size_t set_tid_size, |
| int flags, |
| int expected, |
| int expected_pid, |
| bool wait_for_it) |
| { |
| int ret; |
| |
| ksft_print_msg( |
| "[%d] Trying clone3() with CLONE_SET_TID to %d and 0x%x\n", |
| getpid(), set_tid[0], flags); |
| ret = call_clone3_set_tid(set_tid, set_tid_size, flags, expected_pid, |
| wait_for_it); |
| ksft_print_msg( |
| "[%d] clone3() with CLONE_SET_TID %d says :%d - expected %d\n", |
| getpid(), set_tid[0], ret, expected); |
| if (ret != expected) |
| ksft_test_result_fail( |
| "[%d] Result (%d) is different than expected (%d)\n", |
| getpid(), ret, expected); |
| else |
| ksft_test_result_pass( |
| "[%d] Result (%d) matches expectation (%d)\n", |
| getpid(), ret, expected); |
| } |
| int main(int argc, char *argv[]) |
| { |
| FILE *f; |
| char buf; |
| char *line; |
| int status; |
| int ret = -1; |
| size_t len = 0; |
| int pid_max = 0; |
| uid_t uid = getuid(); |
| char proc_path[100] = {0}; |
| pid_t pid, ns1, ns2, ns3, ns_pid; |
| pid_t set_tid[MAX_PID_NS_LEVEL * 2]; |
| |
| ksft_print_header(); |
| ksft_set_plan(29); |
| test_clone3_supported(); |
| |
| if (pipe(pipe_1) < 0 || pipe(pipe_2) < 0) |
| ksft_exit_fail_msg("pipe() failed\n"); |
| |
| f = fopen("/proc/sys/kernel/pid_max", "r"); |
| if (f == NULL) |
| ksft_exit_fail_msg( |
| "%s - Could not open /proc/sys/kernel/pid_max\n", |
| strerror(errno)); |
| fscanf(f, "%d", &pid_max); |
| fclose(f); |
| ksft_print_msg("/proc/sys/kernel/pid_max %d\n", pid_max); |
| |
| /* Try invalid settings */ |
| memset(&set_tid, 0, sizeof(set_tid)); |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL + 1, 0, -EINVAL, 0, 0); |
| |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL * 2, 0, -EINVAL, 0, 0); |
| |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL * 2 + 1, 0, |
| -EINVAL, 0, 0); |
| |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL * 42, 0, -EINVAL, 0, 0); |
| |
| /* |
| * This can actually work if this test running in a MAX_PID_NS_LEVEL - 1 |
| * nested PID namespace. |
| */ |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL - 1, 0, -EINVAL, 0, 0); |
| |
| memset(&set_tid, 0xff, sizeof(set_tid)); |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL + 1, 0, -EINVAL, 0, 0); |
| |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL * 2, 0, -EINVAL, 0, 0); |
| |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL * 2 + 1, 0, |
| -EINVAL, 0, 0); |
| |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL * 42, 0, -EINVAL, 0, 0); |
| |
| /* |
| * This can actually work if this test running in a MAX_PID_NS_LEVEL - 1 |
| * nested PID namespace. |
| */ |
| test_clone3_set_tid(set_tid, MAX_PID_NS_LEVEL - 1, 0, -EINVAL, 0, 0); |
| |
| memset(&set_tid, 0, sizeof(set_tid)); |
| /* Try with an invalid PID */ |
| set_tid[0] = 0; |
| test_clone3_set_tid(set_tid, 1, 0, -EINVAL, 0, 0); |
| |
| set_tid[0] = -1; |
| test_clone3_set_tid(set_tid, 1, 0, -EINVAL, 0, 0); |
| |
| /* Claim that the set_tid array actually contains 2 elements. */ |
| test_clone3_set_tid(set_tid, 2, 0, -EINVAL, 0, 0); |
| |
| /* Try it in a new PID namespace */ |
| if (uid == 0) |
| test_clone3_set_tid(set_tid, 1, CLONE_NEWPID, -EINVAL, 0, 0); |
| else |
| ksft_test_result_skip("Clone3() with set_tid requires root\n"); |
| |
| /* Try with a valid PID (1) this should return -EEXIST. */ |
| set_tid[0] = 1; |
| if (uid == 0) |
| test_clone3_set_tid(set_tid, 1, 0, -EEXIST, 0, 0); |
| else |
| ksft_test_result_skip("Clone3() with set_tid requires root\n"); |
| |
| /* Try it in a new PID namespace */ |
| if (uid == 0) |
| test_clone3_set_tid(set_tid, 1, CLONE_NEWPID, 0, 0, 0); |
| else |
| ksft_test_result_skip("Clone3() with set_tid requires root\n"); |
| |
| /* pid_max should fail everywhere */ |
| set_tid[0] = pid_max; |
| test_clone3_set_tid(set_tid, 1, 0, -EINVAL, 0, 0); |
| |
| if (uid == 0) |
| test_clone3_set_tid(set_tid, 1, CLONE_NEWPID, -EINVAL, 0, 0); |
| else |
| ksft_test_result_skip("Clone3() with set_tid requires root\n"); |
| |
| if (uid != 0) { |
| /* |
| * All remaining tests require root. Tell the framework |
| * that all those tests are skipped as non-root. |
| */ |
| ksft_cnt.ksft_xskip += ksft_plan - ksft_test_num(); |
| goto out; |
| } |
| |
| /* Find the current active PID */ |
| pid = fork(); |
| if (pid == 0) { |
| ksft_print_msg("Child has PID %d\n", getpid()); |
| child_exit(EXIT_SUCCESS); |
| } |
| if (waitpid(pid, &status, 0) < 0) |
| ksft_exit_fail_msg("Waiting for child %d failed", pid); |
| |
| /* After the child has finished, its PID should be free. */ |
| set_tid[0] = pid; |
| test_clone3_set_tid(set_tid, 1, 0, 0, 0, 0); |
| |
| /* This should fail as there is no PID 1 in that namespace */ |
| test_clone3_set_tid(set_tid, 1, CLONE_NEWPID, -EINVAL, 0, 0); |
| |
| /* |
| * Creating a process with PID 1 in the newly created most nested |
| * PID namespace and PID 'pid' in the parent PID namespace. This |
| * needs to work. |
| */ |
| set_tid[0] = 1; |
| set_tid[1] = pid; |
| test_clone3_set_tid(set_tid, 2, CLONE_NEWPID, 0, pid, 0); |
| |
| ksft_print_msg("unshare PID namespace\n"); |
| if (unshare(CLONE_NEWPID) == -1) |
| ksft_exit_fail_msg("unshare(CLONE_NEWPID) failed: %s\n", |
| strerror(errno)); |
| |
| set_tid[0] = pid; |
| |
| /* This should fail as there is no PID 1 in that namespace */ |
| test_clone3_set_tid(set_tid, 1, 0, -EINVAL, 0, 0); |
| |
| /* Let's create a PID 1 */ |
| ns_pid = fork(); |
| if (ns_pid == 0) { |
| /* |
| * This and the next test cases check that all pid-s are |
| * released on error paths. |
| */ |
| set_tid[0] = 43; |
| set_tid[1] = -1; |
| test_clone3_set_tid(set_tid, 2, 0, -EINVAL, 0, 0); |
| |
| set_tid[0] = 43; |
| set_tid[1] = pid; |
| test_clone3_set_tid(set_tid, 2, 0, 0, 43, 0); |
| |
| ksft_print_msg("Child in PID namespace has PID %d\n", getpid()); |
| set_tid[0] = 2; |
| test_clone3_set_tid(set_tid, 1, 0, 0, 2, 0); |
| |
| set_tid[0] = 1; |
| set_tid[1] = -1; |
| set_tid[2] = pid; |
| /* This should fail as there is invalid PID at level '1'. */ |
| test_clone3_set_tid(set_tid, 3, CLONE_NEWPID, -EINVAL, 0, 0); |
| |
| set_tid[0] = 1; |
| set_tid[1] = 42; |
| set_tid[2] = pid; |
| /* |
| * This should fail as there are not enough active PID |
| * namespaces. Again assuming this is running in the host's |
| * PID namespace. Not yet nested. |
| */ |
| test_clone3_set_tid(set_tid, 4, CLONE_NEWPID, -EINVAL, 0, 0); |
| |
| /* |
| * This should work and from the parent we should see |
| * something like 'NSpid: pid 42 1'. |
| */ |
| test_clone3_set_tid(set_tid, 3, CLONE_NEWPID, 0, 42, true); |
| |
| child_exit(ksft_cnt.ksft_fail); |
| } |
| |
| close(pipe_1[1]); |
| close(pipe_2[0]); |
| while (read(pipe_1[0], &buf, 1) > 0) { |
| ksft_print_msg("[%d] Child is ready and waiting\n", getpid()); |
| break; |
| } |
| |
| snprintf(proc_path, sizeof(proc_path), "/proc/%d/status", pid); |
| f = fopen(proc_path, "r"); |
| if (f == NULL) |
| ksft_exit_fail_msg( |
| "%s - Could not open %s\n", |
| strerror(errno), proc_path); |
| |
| while (getline(&line, &len, f) != -1) { |
| if (strstr(line, "NSpid")) { |
| int i; |
| |
| /* Verify that all generated PIDs are as expected. */ |
| i = sscanf(line, "NSpid:\t%d\t%d\t%d", |
| &ns3, &ns2, &ns1); |
| if (i != 3) { |
| ksft_print_msg( |
| "Unexpected 'NSPid:' entry: %s", |
| line); |
| ns1 = ns2 = ns3 = 0; |
| } |
| break; |
| } |
| } |
| fclose(f); |
| free(line); |
| close(pipe_2[0]); |
| |
| /* Tell the clone3()'d child to finish. */ |
| write(pipe_2[1], &buf, 1); |
| close(pipe_2[1]); |
| |
| if (waitpid(ns_pid, &status, 0) < 0) { |
| ksft_print_msg("Child returned %s\n", strerror(errno)); |
| ret = -errno; |
| goto out; |
| } |
| |
| if (!WIFEXITED(status)) |
| ksft_test_result_fail("Child error\n"); |
| |
| ksft_cnt.ksft_pass += 6 - (ksft_cnt.ksft_fail - WEXITSTATUS(status)); |
| ksft_cnt.ksft_fail = WEXITSTATUS(status); |
| |
| if (ns3 == pid && ns2 == 42 && ns1 == 1) |
| ksft_test_result_pass( |
| "PIDs in all namespaces as expected (%d,%d,%d)\n", |
| ns3, ns2, ns1); |
| else |
| ksft_test_result_fail( |
| "PIDs in all namespaces not as expected (%d,%d,%d)\n", |
| ns3, ns2, ns1); |
| out: |
| ret = 0; |
| |
| return !ret ? ksft_exit_pass() : ksft_exit_fail(); |
| } |