| // SPDX-License-Identifier: GPL-2.0 |
| /* |
| * fs/signalfd.c |
| * |
| * Copyright (C) 2003 Linus Torvalds |
| * |
| * Mon Mar 5, 2007: Davide Libenzi <davidel@xmailserver.org> |
| * Changed ->read() to return a siginfo structure instead of signal number. |
| * Fixed locking in ->poll(). |
| * Added sighand-detach notification. |
| * Added fd re-use in sys_signalfd() syscall. |
| * Now using anonymous inode source. |
| * Thanks to Oleg Nesterov for useful code review and suggestions. |
| * More comments and suggestions from Arnd Bergmann. |
| * Sat May 19, 2007: Davi E. M. Arnaut <davi@haxent.com.br> |
| * Retrieve multiple signals with one read() call |
| * Sun Jul 15, 2007: Davide Libenzi <davidel@xmailserver.org> |
| * Attach to the sighand only during read() and poll(). |
| */ |
| |
| #include <linux/file.h> |
| #include <linux/poll.h> |
| #include <linux/init.h> |
| #include <linux/fs.h> |
| #include <linux/sched.h> |
| #include <linux/slab.h> |
| #include <linux/kernel.h> |
| #include <linux/signal.h> |
| #include <linux/list.h> |
| #include <linux/anon_inodes.h> |
| #include <linux/signalfd.h> |
| #include <linux/syscalls.h> |
| #include <linux/proc_fs.h> |
| #include <linux/compat.h> |
| |
| void signalfd_cleanup(struct sighand_struct *sighand) |
| { |
| wait_queue_head_t *wqh = &sighand->signalfd_wqh; |
| /* |
| * The lockless check can race with remove_wait_queue() in progress, |
| * but in this case its caller should run under rcu_read_lock() and |
| * sighand_cachep is SLAB_TYPESAFE_BY_RCU, we can safely return. |
| */ |
| if (likely(!waitqueue_active(wqh))) |
| return; |
| |
| /* wait_queue_entry_t->func(POLLFREE) should do remove_wait_queue() */ |
| wake_up_poll(wqh, EPOLLHUP | POLLFREE); |
| } |
| |
| struct signalfd_ctx { |
| sigset_t sigmask; |
| }; |
| |
| static int signalfd_release(struct inode *inode, struct file *file) |
| { |
| kfree(file->private_data); |
| return 0; |
| } |
| |
| static __poll_t signalfd_poll(struct file *file, poll_table *wait) |
| { |
| struct signalfd_ctx *ctx = file->private_data; |
| __poll_t events = 0; |
| |
| poll_wait(file, ¤t->sighand->signalfd_wqh, wait); |
| |
| spin_lock_irq(¤t->sighand->siglock); |
| if (next_signal(¤t->pending, &ctx->sigmask) || |
| next_signal(¤t->signal->shared_pending, |
| &ctx->sigmask)) |
| events |= EPOLLIN; |
| spin_unlock_irq(¤t->sighand->siglock); |
| |
| return events; |
| } |
| |
| /* |
| * Copied from copy_siginfo_to_user() in kernel/signal.c |
| */ |
| static int signalfd_copyinfo(struct signalfd_siginfo __user *uinfo, |
| kernel_siginfo_t const *kinfo) |
| { |
| struct signalfd_siginfo new; |
| |
| BUILD_BUG_ON(sizeof(struct signalfd_siginfo) != 128); |
| |
| /* |
| * Unused members should be zero ... |
| */ |
| memset(&new, 0, sizeof(new)); |
| |
| /* |
| * If you change siginfo_t structure, please be sure |
| * this code is fixed accordingly. |
| */ |
| new.ssi_signo = kinfo->si_signo; |
| new.ssi_errno = kinfo->si_errno; |
| new.ssi_code = kinfo->si_code; |
| switch (siginfo_layout(kinfo->si_signo, kinfo->si_code)) { |
| case SIL_KILL: |
| new.ssi_pid = kinfo->si_pid; |
| new.ssi_uid = kinfo->si_uid; |
| break; |
| case SIL_TIMER: |
| new.ssi_tid = kinfo->si_tid; |
| new.ssi_overrun = kinfo->si_overrun; |
| new.ssi_ptr = (long) kinfo->si_ptr; |
| new.ssi_int = kinfo->si_int; |
| break; |
| case SIL_POLL: |
| new.ssi_band = kinfo->si_band; |
| new.ssi_fd = kinfo->si_fd; |
| break; |
| case SIL_FAULT_BNDERR: |
| case SIL_FAULT_PKUERR: |
| /* |
| * Fall through to the SIL_FAULT case. Both SIL_FAULT_BNDERR |
| * and SIL_FAULT_PKUERR are only generated by faults that |
| * deliver them synchronously to userspace. In case someone |
| * injects one of these signals and signalfd catches it treat |
| * it as SIL_FAULT. |
| */ |
| case SIL_FAULT: |
| new.ssi_addr = (long) kinfo->si_addr; |
| #ifdef __ARCH_SI_TRAPNO |
| new.ssi_trapno = kinfo->si_trapno; |
| #endif |
| break; |
| case SIL_FAULT_MCEERR: |
| new.ssi_addr = (long) kinfo->si_addr; |
| #ifdef __ARCH_SI_TRAPNO |
| new.ssi_trapno = kinfo->si_trapno; |
| #endif |
| new.ssi_addr_lsb = (short) kinfo->si_addr_lsb; |
| break; |
| case SIL_PERF_EVENT: |
| new.ssi_addr = (long) kinfo->si_addr; |
| new.ssi_perf = kinfo->si_perf; |
| break; |
| case SIL_CHLD: |
| new.ssi_pid = kinfo->si_pid; |
| new.ssi_uid = kinfo->si_uid; |
| new.ssi_status = kinfo->si_status; |
| new.ssi_utime = kinfo->si_utime; |
| new.ssi_stime = kinfo->si_stime; |
| break; |
| case SIL_RT: |
| /* |
| * This case catches also the signals queued by sigqueue(). |
| */ |
| new.ssi_pid = kinfo->si_pid; |
| new.ssi_uid = kinfo->si_uid; |
| new.ssi_ptr = (long) kinfo->si_ptr; |
| new.ssi_int = kinfo->si_int; |
| break; |
| case SIL_SYS: |
| new.ssi_call_addr = (long) kinfo->si_call_addr; |
| new.ssi_syscall = kinfo->si_syscall; |
| new.ssi_arch = kinfo->si_arch; |
| break; |
| } |
| |
| if (copy_to_user(uinfo, &new, sizeof(struct signalfd_siginfo))) |
| return -EFAULT; |
| |
| return sizeof(*uinfo); |
| } |
| |
| static ssize_t signalfd_dequeue(struct signalfd_ctx *ctx, kernel_siginfo_t *info, |
| int nonblock) |
| { |
| ssize_t ret; |
| DECLARE_WAITQUEUE(wait, current); |
| |
| spin_lock_irq(¤t->sighand->siglock); |
| ret = dequeue_signal(current, &ctx->sigmask, info); |
| switch (ret) { |
| case 0: |
| if (!nonblock) |
| break; |
| ret = -EAGAIN; |
| fallthrough; |
| default: |
| spin_unlock_irq(¤t->sighand->siglock); |
| return ret; |
| } |
| |
| add_wait_queue(¤t->sighand->signalfd_wqh, &wait); |
| for (;;) { |
| set_current_state(TASK_INTERRUPTIBLE); |
| ret = dequeue_signal(current, &ctx->sigmask, info); |
| if (ret != 0) |
| break; |
| if (signal_pending(current)) { |
| ret = -ERESTARTSYS; |
| break; |
| } |
| spin_unlock_irq(¤t->sighand->siglock); |
| schedule(); |
| spin_lock_irq(¤t->sighand->siglock); |
| } |
| spin_unlock_irq(¤t->sighand->siglock); |
| |
| remove_wait_queue(¤t->sighand->signalfd_wqh, &wait); |
| __set_current_state(TASK_RUNNING); |
| |
| return ret; |
| } |
| |
| /* |
| * Returns a multiple of the size of a "struct signalfd_siginfo", or a negative |
| * error code. The "count" parameter must be at least the size of a |
| * "struct signalfd_siginfo". |
| */ |
| static ssize_t signalfd_read(struct file *file, char __user *buf, size_t count, |
| loff_t *ppos) |
| { |
| struct signalfd_ctx *ctx = file->private_data; |
| struct signalfd_siginfo __user *siginfo; |
| int nonblock = file->f_flags & O_NONBLOCK; |
| ssize_t ret, total = 0; |
| kernel_siginfo_t info; |
| |
| count /= sizeof(struct signalfd_siginfo); |
| if (!count) |
| return -EINVAL; |
| |
| siginfo = (struct signalfd_siginfo __user *) buf; |
| do { |
| ret = signalfd_dequeue(ctx, &info, nonblock); |
| if (unlikely(ret <= 0)) |
| break; |
| ret = signalfd_copyinfo(siginfo, &info); |
| if (ret < 0) |
| break; |
| siginfo++; |
| total += ret; |
| nonblock = 1; |
| } while (--count); |
| |
| return total ? total: ret; |
| } |
| |
#ifdef CONFIG_PROC_FS
/*
 * ->show_fdinfo() handler: emit a "sigmask:" line for this signalfd.
 *
 * ctx->sigmask is stored inverted by do_signalfd4(), so a local copy is
 * flipped back with signotset() before it is rendered.
 */
static void signalfd_show_fdinfo(struct seq_file *m, struct file *f)
{
	struct signalfd_ctx *ctx = f->private_data;
	sigset_t shown = ctx->sigmask;

	signotset(&shown);
	render_sigset_t(m, "sigmask:\t", &shown);
}
#endif
| |
| static const struct file_operations signalfd_fops = { |
| #ifdef CONFIG_PROC_FS |
| .show_fdinfo = signalfd_show_fdinfo, |
| #endif |
| .release = signalfd_release, |
| .poll = signalfd_poll, |
| .read = signalfd_read, |
| .llseek = noop_llseek, |
| }; |
| |
| static int do_signalfd4(int ufd, sigset_t *mask, int flags) |
| { |
| struct signalfd_ctx *ctx; |
| |
| /* Check the SFD_* constants for consistency. */ |
| BUILD_BUG_ON(SFD_CLOEXEC != O_CLOEXEC); |
| BUILD_BUG_ON(SFD_NONBLOCK != O_NONBLOCK); |
| |
| if (flags & ~(SFD_CLOEXEC | SFD_NONBLOCK)) |
| return -EINVAL; |
| |
| sigdelsetmask(mask, sigmask(SIGKILL) | sigmask(SIGSTOP)); |
| signotset(mask); |
| |
| if (ufd == -1) { |
| ctx = kmalloc(sizeof(*ctx), GFP_KERNEL); |
| if (!ctx) |
| return -ENOMEM; |
| |
| ctx->sigmask = *mask; |
| |
| /* |
| * When we call this, the initialization must be complete, since |
| * anon_inode_getfd() will install the fd. |
| */ |
| ufd = anon_inode_getfd("[signalfd]", &signalfd_fops, ctx, |
| O_RDWR | (flags & (O_CLOEXEC | O_NONBLOCK))); |
| if (ufd < 0) |
| kfree(ctx); |
| } else { |
| struct fd f = fdget(ufd); |
| if (!f.file) |
| return -EBADF; |
| ctx = f.file->private_data; |
| if (f.file->f_op != &signalfd_fops) { |
| fdput(f); |
| return -EINVAL; |
| } |
| spin_lock_irq(¤t->sighand->siglock); |
| ctx->sigmask = *mask; |
| spin_unlock_irq(¤t->sighand->siglock); |
| |
| wake_up(¤t->sighand->signalfd_wqh); |
| fdput(f); |
| } |
| |
| return ufd; |
| } |
| |
| SYSCALL_DEFINE4(signalfd4, int, ufd, sigset_t __user *, user_mask, |
| size_t, sizemask, int, flags) |
| { |
| sigset_t mask; |
| |
| if (sizemask != sizeof(sigset_t)) |
| return -EINVAL; |
| if (copy_from_user(&mask, user_mask, sizeof(mask))) |
| return -EFAULT; |
| return do_signalfd4(ufd, &mask, flags); |
| } |
| |
| SYSCALL_DEFINE3(signalfd, int, ufd, sigset_t __user *, user_mask, |
| size_t, sizemask) |
| { |
| sigset_t mask; |
| |
| if (sizemask != sizeof(sigset_t)) |
| return -EINVAL; |
| if (copy_from_user(&mask, user_mask, sizeof(mask))) |
| return -EFAULT; |
| return do_signalfd4(ufd, &mask, 0); |
| } |
| |
| #ifdef CONFIG_COMPAT |
| static long do_compat_signalfd4(int ufd, |
| const compat_sigset_t __user *user_mask, |
| compat_size_t sigsetsize, int flags) |
| { |
| sigset_t mask; |
| |
| if (sigsetsize != sizeof(compat_sigset_t)) |
| return -EINVAL; |
| if (get_compat_sigset(&mask, user_mask)) |
| return -EFAULT; |
| return do_signalfd4(ufd, &mask, flags); |
| } |
| |
| COMPAT_SYSCALL_DEFINE4(signalfd4, int, ufd, |
| const compat_sigset_t __user *, user_mask, |
| compat_size_t, sigsetsize, |
| int, flags) |
| { |
| return do_compat_signalfd4(ufd, user_mask, sigsetsize, flags); |
| } |
| |
| COMPAT_SYSCALL_DEFINE3(signalfd, int, ufd, |
| const compat_sigset_t __user *, user_mask, |
| compat_size_t, sigsetsize) |
| { |
| return do_compat_signalfd4(ufd, user_mask, sigsetsize, 0); |
| } |
| #endif |