kernel/hung_task.c: Monitor killed tasks.

author Tetsuo Handa <penguin-kernel@i-love.sakura.ne.jp>

Thu, 22 Apr 2021 06:42:53 +0000 (16:42 +1000)

committer Stephen Rothwell <sfr@canb.auug.org.au>

Wed, 5 May 2021 22:09:20 +0000 (08:09 +1000)
author Tetsuo Handa <penguin-kernel@i-love.sakura.ne.jp>
Thu, 22 Apr 2021 06:42:53 +0000 (16:42 +1000)
committer Stephen Rothwell <sfr@canb.auug.org.au>
Wed, 5 May 2021 22:09:20 +0000 (08:09 +1000)
diff --git a/include/linux/sched.h b/include/linux/sched.h

index 08fb28ead30a7e858cb7b79937ce8017de104a4f..8d5264b18cb66366aa5a8d8f7e6ce11145a17537 100644 (file)
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -972,6 +972,7 @@ struct task_struct {
  #ifdef CONFIG_DETECT_HUNG_TASK
         unsigned long                   last_switch_count;
         unsigned long                   last_switch_time;
+       unsigned long                   killed_time;
  #endif
         /* Filesystem information: */
         struct fs_struct                *fs;
diff --git a/kernel/hung_task.c b/kernel/hung_task.c

index 396ebaebea3fea3578fe295c73cf041530a91d93..bb2e3e15c84c0f03dd9b99789ac26c350f26b5cd 100644 (file)
--- a/kernel/hung_task.c
+++ b/kernel/hung_task.c
@@ -144,6 +144,47 @@ static void check_hung_task(struct task_struct *t, unsigned long timeout)
         touch_nmi_watchdog();
  }
  
+static void check_killed_task(struct task_struct *t, unsigned long timeout)
+{
+       unsigned long stamp = t->killed_time;
+
+       /*
+        * Ensure the task is not frozen.
+        * Also, skip vfork and any other user process that freezer should skip.
+        */
+       if (unlikely(t->flags & (PF_FROZEN | PF_FREEZER_SKIP)))
+               return;
+       /*
+        * Skip threads which are already inside do_exit(), for exit_mm() etc.
+        * might take many seconds.
+        */
+       if (t->flags & PF_EXITING)
+               return;
+       if (!stamp) {   /* first sighting: start the clock, report nothing */
+               stamp = jiffies;
+               if (!stamp)     /* 0 means "not stamped yet"; never store it */
+                       stamp++;
+               t->killed_time = stamp;
+               return;
+       }
+       if (time_is_after_jiffies(stamp + timeout * HZ)) /* not overdue yet */
+               return;
+       trace_sched_process_hang(t);
+       if (sysctl_hung_task_panic) {
+               console_verbose();
+               hung_task_call_panic = true;
+       }
+       /*
+        * This thread failed to terminate for more than
+        * sysctl_hung_task_timeout_secs seconds, complain:
+        */
+       pr_err("INFO: task %s:%d can't die for more than %lu seconds.\n",
+              t->comm, t->pid, (jiffies - stamp) / HZ);
+       sched_show_task(t);
+       hung_task_show_lock = true;
+       touch_nmi_watchdog();
+}
+
  /*
   * To avoid extending the RCU grace period for an unbounded amount of time,
   * periodically exit the critical section and enter a new one.
@@ -195,6 +236,9 @@ static void check_hung_uninterruptible_tasks(unsigned long timeout)
                                 goto unlock;
                         last_break = jiffies;
                 }
+               /* Check threads which are about to terminate. */
+               if (unlikely(fatal_signal_pending(t)))
+                       check_killed_task(t, timeout);
                 /* use "==" to skip the TASK_KILLABLE tasks waiting on NFS */
                 if (t->state == TASK_UNINTERRUPTIBLE)
                         check_hung_task(t, timeout);
author	Tetsuo Handa <penguin-kernel@i-love.sakura.ne.jp>
	Thu, 22 Apr 2021 06:42:53 +0000 (16:42 +1000)
committer	Stephen Rothwell <sfr@canb.auug.org.au>
	Wed, 5 May 2021 22:09:20 +0000 (08:09 +1000)
include/linux/sched.h		patch \| blob \| history
kernel/hung_task.c		patch \| blob \| history