This reverts commit bb304a5c6fc63d8506cd9741a3a5f35b73605625.

Because this patch leads to kthread zombies.

call_usermodehelper_exec_sync() does fork() + wait() with "unignored"
SIGCHLD. What we have missed is that this worker thread can have other
children previously forked by call_usermodehelper_exec_work() without
UMH_WAIT_PROC. If such a child exits in between it becomes a zombie
and nobody can reap it (unless/until this worker thread exits too).

Signed-off-by: Oleg Nesterov <o...@redhat.com>
---
 kernel/kmod.c | 44 ++++++++++++++++++++++++--------------------
 1 file changed, 24 insertions(+), 20 deletions(-)

diff --git a/kernel/kmod.c b/kernel/kmod.c
index da98d05..d38b2da 100644
--- a/kernel/kmod.c
+++ b/kernel/kmod.c
@@ -265,9 +265,15 @@ out:
        do_exit(0);
 }
 
-/* Handles UMH_WAIT_PROC.  */
-static void call_usermodehelper_exec_sync(struct subprocess_info *sub_info)
+/*
+ * Handles UMH_WAIT_PROC. Our parent (unbound workqueue) might not be able to
+ * run enough instances to handle usermodehelper completions without blocking
+ * some other pending requests. That's why we use a kernel thread dedicated for
+ * that purpose.
+ */
+static int call_usermodehelper_exec_sync(void *data)
 {
+       struct subprocess_info *sub_info = data;
        pid_t pid;
 
        /* If SIGCLD is ignored sys_wait4 won't populate the status. */
@@ -281,9 +287,9 @@ static void call_usermodehelper_exec_sync(struct 
subprocess_info *sub_info)
                 * Normally it is bogus to call wait4() from in-kernel because
                 * wait4() wants to write the exit code to a userspace address.
                 * But call_usermodehelper_exec_sync() always runs as kernel
-                * thread (workqueue) and put_user() to a kernel address works
-                * OK for kernel threads, due to their having an mm_segment_t
-                * which spans the entire address space.
+                * thread and put_user() to a kernel address works OK for kernel
+                * threads, due to their having an mm_segment_t which spans the
+                * entire address space.
                 *
                 * Thus the __user pointer cast is valid here.
                 */
@@ -298,21 +304,19 @@ static void call_usermodehelper_exec_sync(struct 
subprocess_info *sub_info)
                        sub_info->retval = ret;
        }
 
-       /* Restore default kernel sig handler */
-       kernel_sigaction(SIGCHLD, SIG_IGN);
-
        umh_complete(sub_info);
+       do_exit(0);
 }
 
 /*
- * We need to create the usermodehelper kernel thread from a task that is 
affine
+ * This function doesn't strictly needs to be called asynchronously. But we
+ * need to create the usermodehelper kernel threads from a task that is affine
  * to an optimized set of CPUs (or nohz housekeeping ones) such that they
  * inherit a widest affinity irrespective of call_usermodehelper() callers with
  * possibly reduced affinity (eg: per-cpu workqueues). We don't want
  * usermodehelper targets to contend a busy CPU.
  *
- * Unbound workqueues provide such wide affinity and allow to block on
- * UMH_WAIT_PROC requests without blocking pending request (up to some limit).
+ * Unbound workqueues provide such wide affinity.
  *
  * Besides, workqueues provide the privilege level that caller might not have
  * to perform the usermodehelper request.
@@ -322,18 +326,18 @@ static void call_usermodehelper_exec_work(struct 
work_struct *work)
 {
        struct subprocess_info *sub_info =
                container_of(work, struct subprocess_info, work);
+       pid_t pid;
 
-       if (sub_info->wait & UMH_WAIT_PROC) {
-               call_usermodehelper_exec_sync(sub_info);
-       } else {
-               pid_t pid;
-
+       if (sub_info->wait & UMH_WAIT_PROC)
+               pid = kernel_thread(call_usermodehelper_exec_sync, sub_info,
+                                   CLONE_FS | CLONE_FILES | SIGCHLD);
+       else
                pid = kernel_thread(call_usermodehelper_exec_async, sub_info,
                                    SIGCHLD);
-               if (pid < 0) {
-                       sub_info->retval = pid;
-                       umh_complete(sub_info);
-               }
+
+       if (pid < 0) {
+               sub_info->retval = pid;
+               umh_complete(sub_info);
        }
 }
 
-- 
2.4.3


--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Reply via email to