signalfd.c 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343
  1. /*
  2. * fs/signalfd.c
  3. *
  4. * Copyright (C) 2003 Linus Torvalds
  5. *
  6. * Mon Mar 5, 2007: Davide Libenzi <davidel@xmailserver.org>
  7. * Changed ->read() to return a siginfo structure instead of signal number.
  8. * Fixed locking in ->poll().
  9. * Added sighand-detach notification.
  10. * Added fd re-use in sys_signalfd() syscall.
  11. * Now using anonymous inode source.
  12. * Thanks to Oleg Nesterov for useful code review and suggestions.
  13. * More comments and suggestions from Arnd Bergmann.
  14. * Sat May 19, 2007: Davi E. M. Arnaut <davi@haxent.com.br>
  15. * Retrieve multiple signals with one read() call
  16. * Sun Jul 15, 2007: Davide Libenzi <davidel@xmailserver.org>
  17. * Attach to the sighand only during read() and poll().
  18. */
  19. #include <linux/file.h>
  20. #include <linux/poll.h>
  21. #include <linux/init.h>
  22. #include <linux/fs.h>
  23. #include <linux/sched.h>
  24. #include <linux/slab.h>
  25. #include <linux/kernel.h>
  26. #include <linux/signal.h>
  27. #include <linux/list.h>
  28. #include <linux/anon_inodes.h>
  29. #include <linux/signalfd.h>
  30. #include <linux/syscalls.h>
  31. #include <linux/proc_fs.h>
  32. #include <linux/compat.h>
  33. void signalfd_cleanup(struct sighand_struct *sighand)
  34. {
  35. wait_queue_head_t *wqh = &sighand->signalfd_wqh;
  36. /*
  37. * The lockless check can race with remove_wait_queue() in progress,
  38. * but in this case its caller should run under rcu_read_lock() and
  39. * sighand_cachep is SLAB_DESTROY_BY_RCU, we can safely return.
  40. */
  41. if (likely(!waitqueue_active(wqh)))
  42. return;
  43. /* wait_queue_t->func(POLLFREE) should do remove_wait_queue() */
  44. wake_up_poll(wqh, POLLHUP | POLLFREE);
  45. }
/*
 * Per-file state of a signalfd, stored in file->private_data.
 */
struct signalfd_ctx {
	/*
	 * Stored inverted: signalfd4() strips SIGKILL/SIGSTOP from the
	 * user-supplied set and then applies signotset() before saving it
	 * here; signalfd_show_fdinfo() inverts it again for display.
	 * Updated under current->sighand->siglock when an existing fd is
	 * re-armed, and read under that lock by poll and dequeue.
	 */
	sigset_t sigmask;
};
  49. static int signalfd_release(struct inode *inode, struct file *file)
  50. {
  51. kfree(file->private_data);
  52. return 0;
  53. }
  54. static unsigned int signalfd_poll(struct file *file, poll_table *wait)
  55. {
  56. struct signalfd_ctx *ctx = file->private_data;
  57. unsigned int events = 0;
  58. poll_wait(file, &current->sighand->signalfd_wqh, wait);
  59. spin_lock_irq(&current->sighand->siglock);
  60. if (next_signal(&current->pending, &ctx->sigmask) ||
  61. next_signal(&current->signal->shared_pending,
  62. &ctx->sigmask))
  63. events |= POLLIN;
  64. spin_unlock_irq(&current->sighand->siglock);
  65. return events;
  66. }
/*
 * signalfd_copyinfo - write one kernel siginfo_t to user space in the
 * struct signalfd_siginfo layout.
 *
 * Copied from copy_siginfo_to_user() in kernel/signal.c
 *
 * @uinfo: user-space destination record.
 * @kinfo: kernel-side signal information to translate.
 *
 * The destination is cleared first, then si_signo/si_errno/si_code are
 * stored, followed by the fields selected by the class bits of si_code
 * (si_code & __SI_MASK).
 *
 * Only the unchecked __clear_user()/__put_user() helpers are used here.
 * NOTE(review): presumably the caller's user range has already been
 * validated before ->read() is invoked -- confirm.
 *
 * Returns sizeof(struct signalfd_siginfo) on success, or -EFAULT if any of
 * the user-space stores reported an error.
 */
static int signalfd_copyinfo(struct signalfd_siginfo __user *uinfo,
			     siginfo_t const *kinfo)
{
	/* Accumulates (by OR) the result of every user-space store. */
	long err;

	/* The user-visible record size is fixed at 128 bytes. */
	BUILD_BUG_ON(sizeof(struct signalfd_siginfo) != 128);

	/*
	 * Unused members should be zero ...
	 */
	err = __clear_user(uinfo, sizeof(*uinfo));

	/*
	 * If you change siginfo_t structure, please be sure
	 * this code is fixed accordingly.
	 */
	err |= __put_user(kinfo->si_signo, &uinfo->ssi_signo);
	err |= __put_user(kinfo->si_errno, &uinfo->ssi_errno);
	err |= __put_user((short) kinfo->si_code, &uinfo->ssi_code);
	/* The remaining fields depend on the class encoded in si_code. */
	switch (kinfo->si_code & __SI_MASK) {
	case __SI_KILL:
		err |= __put_user(kinfo->si_pid, &uinfo->ssi_pid);
		err |= __put_user(kinfo->si_uid, &uinfo->ssi_uid);
		break;
	case __SI_TIMER:
		err |= __put_user(kinfo->si_tid, &uinfo->ssi_tid);
		err |= __put_user(kinfo->si_overrun, &uinfo->ssi_overrun);
		err |= __put_user((long) kinfo->si_ptr, &uinfo->ssi_ptr);
		err |= __put_user(kinfo->si_int, &uinfo->ssi_int);
		break;
	case __SI_POLL:
		err |= __put_user(kinfo->si_band, &uinfo->ssi_band);
		err |= __put_user(kinfo->si_fd, &uinfo->ssi_fd);
		break;
	case __SI_FAULT:
		err |= __put_user((long) kinfo->si_addr, &uinfo->ssi_addr);
#ifdef __ARCH_SI_TRAPNO
		err |= __put_user(kinfo->si_trapno, &uinfo->ssi_trapno);
#endif
#ifdef BUS_MCEERR_AO
		/*
		 * Other callers might not initialize the si_lsb field,
		 * so check explicitly for the right codes here.
		 */
		if (kinfo->si_code == BUS_MCEERR_AR ||
		    kinfo->si_code == BUS_MCEERR_AO)
			err |= __put_user((short) kinfo->si_addr_lsb,
					  &uinfo->ssi_addr_lsb);
#endif
		break;
	case __SI_CHLD:
		err |= __put_user(kinfo->si_pid, &uinfo->ssi_pid);
		err |= __put_user(kinfo->si_uid, &uinfo->ssi_uid);
		err |= __put_user(kinfo->si_status, &uinfo->ssi_status);
		err |= __put_user(kinfo->si_utime, &uinfo->ssi_utime);
		err |= __put_user(kinfo->si_stime, &uinfo->ssi_stime);
		break;
	case __SI_RT: /* This is not generated by the kernel as of now. */
	case __SI_MESGQ: /* But this is */
		err |= __put_user(kinfo->si_pid, &uinfo->ssi_pid);
		err |= __put_user(kinfo->si_uid, &uinfo->ssi_uid);
		err |= __put_user((long) kinfo->si_ptr, &uinfo->ssi_ptr);
		err |= __put_user(kinfo->si_int, &uinfo->ssi_int);
		break;
	default:
		/*
		 * This case catches also the signals queued by sigqueue().
		 */
		err |= __put_user(kinfo->si_pid, &uinfo->ssi_pid);
		err |= __put_user(kinfo->si_uid, &uinfo->ssi_uid);
		err |= __put_user((long) kinfo->si_ptr, &uinfo->ssi_ptr);
		err |= __put_user(kinfo->si_int, &uinfo->ssi_int);
		break;
	}

	/* Any failed store collapses into a single -EFAULT. */
	return err ? -EFAULT: sizeof(*uinfo);
}
/*
 * signalfd_dequeue - fetch one signal for the calling task using
 * @ctx->sigmask, optionally sleeping until one is available.
 *
 * @ctx:      signalfd context supplying the mask passed to dequeue_signal().
 * @info:     filled in by dequeue_signal() on success.
 * @nonblock: when non-zero, do not sleep if nothing can be dequeued.
 *
 * Returns the non-zero value produced by dequeue_signal() (presumably the
 * signal number -- confirm against kernel/signal.c), -EAGAIN when nothing
 * was available and @nonblock is set, or -ERESTARTSYS when
 * signal_pending(current) becomes true while waiting.
 */
static ssize_t signalfd_dequeue(struct signalfd_ctx *ctx, siginfo_t *info,
				int nonblock)
{
	ssize_t ret;
	DECLARE_WAITQUEUE(wait, current);

	/* Fast path: try once under siglock before touching the wait queue. */
	spin_lock_irq(&current->sighand->siglock);
	ret = dequeue_signal(current, &ctx->sigmask, info);
	switch (ret) {
	case 0:
		/* Nothing available: blocking callers go on to the wait loop. */
		if (!nonblock)
			break;
		ret = -EAGAIN;
		/* fall through - shares the unlock-and-return path below */
	default:
		spin_unlock_irq(&current->sighand->siglock);
		return ret;
	}

	/* Still holding siglock here; it is only dropped around schedule(). */
	add_wait_queue(&current->sighand->signalfd_wqh, &wait);
	for (;;) {
		/*
		 * The task state is set before re-checking for a signal, in
		 * the usual order for a sleep loop.
		 */
		set_current_state(TASK_INTERRUPTIBLE);
		ret = dequeue_signal(current, &ctx->sigmask, info);
		if (ret != 0)
			break;
		if (signal_pending(current)) {
			ret = -ERESTARTSYS;
			break;
		}
		spin_unlock_irq(&current->sighand->siglock);
		schedule();
		spin_lock_irq(&current->sighand->siglock);
	}
	spin_unlock_irq(&current->sighand->siglock);

	remove_wait_queue(&current->sighand->signalfd_wqh, &wait);
	__set_current_state(TASK_RUNNING);

	return ret;
}
  178. /*
  179. * Returns a multiple of the size of a "struct signalfd_siginfo", or a negative
  180. * error code. The "count" parameter must be at least the size of a
  181. * "struct signalfd_siginfo".
  182. */
  183. static ssize_t signalfd_read(struct file *file, char __user *buf, size_t count,
  184. loff_t *ppos)
  185. {
  186. struct signalfd_ctx *ctx = file->private_data;
  187. struct signalfd_siginfo __user *siginfo;
  188. int nonblock = file->f_flags & O_NONBLOCK;
  189. ssize_t ret, total = 0;
  190. siginfo_t info;
  191. count /= sizeof(struct signalfd_siginfo);
  192. if (!count)
  193. return -EINVAL;
  194. siginfo = (struct signalfd_siginfo __user *) buf;
  195. do {
  196. ret = signalfd_dequeue(ctx, &info, nonblock);
  197. if (unlikely(ret <= 0))
  198. break;
  199. ret = signalfd_copyinfo(siginfo, &info);
  200. if (ret < 0)
  201. break;
  202. siginfo++;
  203. total += ret;
  204. nonblock = 1;
  205. } while (--count);
  206. return total ? total: ret;
  207. }
  208. #ifdef CONFIG_PROC_FS
  209. static void signalfd_show_fdinfo(struct seq_file *m, struct file *f)
  210. {
  211. struct signalfd_ctx *ctx = f->private_data;
  212. sigset_t sigmask;
  213. sigmask = ctx->sigmask;
  214. signotset(&sigmask);
  215. render_sigset_t(m, "sigmask:\t", &sigmask);
  216. }
  217. #endif
  218. static const struct file_operations signalfd_fops = {
  219. #ifdef CONFIG_PROC_FS
  220. .show_fdinfo = signalfd_show_fdinfo,
  221. #endif
  222. .release = signalfd_release,
  223. .poll = signalfd_poll,
  224. .read = signalfd_read,
  225. .llseek = noop_llseek,
  226. };
  227. SYSCALL_DEFINE4(signalfd4, int, ufd, sigset_t __user *, user_mask,
  228. size_t, sizemask, int, flags)
  229. {
  230. sigset_t sigmask;
  231. struct signalfd_ctx *ctx;
  232. /* Check the SFD_* constants for consistency. */
  233. BUILD_BUG_ON(SFD_CLOEXEC != O_CLOEXEC);
  234. BUILD_BUG_ON(SFD_NONBLOCK != O_NONBLOCK);
  235. if (flags & ~(SFD_CLOEXEC | SFD_NONBLOCK))
  236. return -EINVAL;
  237. if (sizemask != sizeof(sigset_t) ||
  238. copy_from_user(&sigmask, user_mask, sizeof(sigmask)))
  239. return -EINVAL;
  240. sigdelsetmask(&sigmask, sigmask(SIGKILL) | sigmask(SIGSTOP));
  241. signotset(&sigmask);
  242. if (ufd == -1) {
  243. ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
  244. if (!ctx)
  245. return -ENOMEM;
  246. ctx->sigmask = sigmask;
  247. /*
  248. * When we call this, the initialization must be complete, since
  249. * anon_inode_getfd() will install the fd.
  250. */
  251. ufd = anon_inode_getfd("[signalfd]", &signalfd_fops, ctx,
  252. O_RDWR | (flags & (O_CLOEXEC | O_NONBLOCK)));
  253. if (ufd < 0)
  254. kfree(ctx);
  255. } else {
  256. struct fd f = fdget(ufd);
  257. if (!f.file)
  258. return -EBADF;
  259. ctx = f.file->private_data;
  260. if (f.file->f_op != &signalfd_fops) {
  261. fdput(f);
  262. return -EINVAL;
  263. }
  264. spin_lock_irq(&current->sighand->siglock);
  265. ctx->sigmask = sigmask;
  266. spin_unlock_irq(&current->sighand->siglock);
  267. wake_up(&current->sighand->signalfd_wqh);
  268. fdput(f);
  269. }
  270. return ufd;
  271. }
  272. SYSCALL_DEFINE3(signalfd, int, ufd, sigset_t __user *, user_mask,
  273. size_t, sizemask)
  274. {
  275. return sys_signalfd4(ufd, user_mask, sizemask, 0);
  276. }
  277. #ifdef CONFIG_COMPAT
  278. COMPAT_SYSCALL_DEFINE4(signalfd4, int, ufd,
  279. const compat_sigset_t __user *,sigmask,
  280. compat_size_t, sigsetsize,
  281. int, flags)
  282. {
  283. compat_sigset_t ss32;
  284. sigset_t tmp;
  285. sigset_t __user *ksigmask;
  286. if (sigsetsize != sizeof(compat_sigset_t))
  287. return -EINVAL;
  288. if (copy_from_user(&ss32, sigmask, sizeof(ss32)))
  289. return -EFAULT;
  290. sigset_from_compat(&tmp, &ss32);
  291. ksigmask = compat_alloc_user_space(sizeof(sigset_t));
  292. if (copy_to_user(ksigmask, &tmp, sizeof(sigset_t)))
  293. return -EFAULT;
  294. return sys_signalfd4(ufd, ksigmask, sizeof(sigset_t), flags);
  295. }
  296. COMPAT_SYSCALL_DEFINE3(signalfd, int, ufd,
  297. const compat_sigset_t __user *,sigmask,
  298. compat_size_t, sigsetsize)
  299. {
  300. return compat_sys_signalfd4(ufd, sigmask, sigsetsize, 0);
  301. }
  302. #endif