blob: 7a1096265f180772021a439c4e394cf7e7c2fb76 [file] [log] [blame]
// SPDX-License-Identifier: GPL-2.0+
/*
 * SoftDog: A Software Watchdog Device
 *
 * (c) Copyright 1996 Alan Cox <alan@lxorguk.ukuu.org.uk>,
 * All Rights Reserved.
 *
 * Neither Alan Cox nor CymruNet Ltd. admit liability nor provide
 * warranty for any of this software. This material is provided
 * "AS-IS" and at no charge.
 *
 * (c) Copyright 1995 Alan Cox <alan@lxorguk.ukuu.org.uk>
 *
 * Software only watchdog driver. Unlike its big brother the WDT501P
 * driver this won't always recover a failed machine.
 */
17
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt

#include <linux/err.h>
#include <linux/hrtimer.h>
#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/kthread.h>
#include <linux/module.h>
#include <linux/moduleparam.h>
#include <linux/reboot.h>
#include <linux/types.h>
#include <linux/watchdog.h>
#include <linux/workqueue.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030
Linus Torvalds1da177e2005-04-16 15:20:36 -070031#define TIMER_MARGIN 60 /* Default is 60 seconds */
Alan Coxa5132ca2012-02-28 22:48:11 +000032static unsigned int soft_margin = TIMER_MARGIN; /* in seconds */
33module_param(soft_margin, uint, 0);
Alan Coxf92d3742008-05-19 14:09:06 +010034MODULE_PARM_DESC(soft_margin,
35 "Watchdog soft_margin in seconds. (0 < soft_margin < 65536, default="
36 __MODULE_STRING(TIMER_MARGIN) ")");
Linus Torvalds1da177e2005-04-16 15:20:36 -070037
Wim Van Sebroeck86a1e182012-03-05 16:51:11 +010038static bool nowayout = WATCHDOG_NOWAYOUT;
39module_param(nowayout, bool, 0);
Alan Coxf92d3742008-05-19 14:09:06 +010040MODULE_PARM_DESC(nowayout,
41 "Watchdog cannot be stopped once started (default="
42 __MODULE_STRING(WATCHDOG_NOWAYOUT) ")");
Linus Torvalds1da177e2005-04-16 15:20:36 -070043
Jingoo Han5f5e1902014-02-27 14:41:42 +090044static int soft_noboot;
Linus Torvalds1da177e2005-04-16 15:20:36 -070045module_param(soft_noboot, int, 0);
Wim Van Sebroecka77dba72009-04-14 20:20:07 +000046MODULE_PARM_DESC(soft_noboot,
Alan Coxa5132ca2012-02-28 22:48:11 +000047 "Softdog action, set to 1 to ignore reboots, 0 to reboot (default=0)");
Linus Torvalds1da177e2005-04-16 15:20:36 -070048
Anithra P Janakiraman7fff4be2011-03-28 14:29:19 -070049static int soft_panic;
50module_param(soft_panic, int, 0);
51MODULE_PARM_DESC(soft_panic,
52 "Softdog action, set to 1 to panic, 0 to reboot (default=0)");
53
Woody Lin36a89472020-07-08 16:32:19 +080054static char *soft_reboot_cmd;
55module_param(soft_reboot_cmd, charp, 0000);
56MODULE_PARM_DESC(soft_reboot_cmd,
57 "Set reboot command. Emergency reboot takes place if unset");
58
59static bool soft_active_on_boot;
60module_param(soft_active_on_boot, bool, 0000);
61MODULE_PARM_DESC(soft_active_on_boot,
62 "Set to true to active Softdog on boot (default=false)");
63
Niklas Cassel8d5755b2017-02-27 13:49:09 +010064static struct hrtimer softdog_ticktock;
65static struct hrtimer softdog_preticktock;
66
Woody Lin36a89472020-07-08 16:32:19 +080067static int reboot_kthread_fn(void *data)
68{
69 kernel_restart(soft_reboot_cmd);
70 return -EPERM; /* Should not reach here */
71}
72
73static void reboot_work_fn(struct work_struct *unused)
74{
75 kthread_run(reboot_kthread_fn, NULL, "softdog_reboot");
76}
77
Niklas Cassel8d5755b2017-02-27 13:49:09 +010078static enum hrtimer_restart softdog_fire(struct hrtimer *timer)
Linus Torvalds1da177e2005-04-16 15:20:36 -070079{
Woody Lin36a89472020-07-08 16:32:19 +080080 static bool soft_reboot_fired;
81
Li RongQing5889f062015-12-17 21:30:02 +080082 module_put(THIS_MODULE);
Wolfram Sang4a23e2b2016-05-25 08:37:49 +020083 if (soft_noboot) {
Joe Perches27c766a2012-02-15 15:06:19 -080084 pr_crit("Triggered - Reboot ignored\n");
Wolfram Sang4a23e2b2016-05-25 08:37:49 +020085 } else if (soft_panic) {
Joe Perches27c766a2012-02-15 15:06:19 -080086 pr_crit("Initiating panic\n");
87 panic("Software Watchdog Timer expired");
Anithra P Janakiraman7fff4be2011-03-28 14:29:19 -070088 } else {
Joe Perches27c766a2012-02-15 15:06:19 -080089 pr_crit("Initiating system reboot\n");
Woody Lin36a89472020-07-08 16:32:19 +080090 if (!soft_reboot_fired && soft_reboot_cmd != NULL) {
91 static DECLARE_WORK(reboot_work, reboot_work_fn);
92 /*
93 * The 'kernel_restart' is a 'might-sleep' operation.
94 * Also, executing it in system-wide workqueues blocks
95 * any driver from using the same workqueue in its
96 * shutdown callback function. Thus, we should execute
97 * the 'kernel_restart' in a standalone kernel thread.
98 * But since starting a kernel thread is also a
99 * 'might-sleep' operation, so the 'reboot_work' is
100 * required as a launcher of the kernel thread.
101 *
102 * After request the reboot, restart the timer to
103 * schedule an 'emergency_restart' reboot after
104 * 'TIMER_MARGIN' seconds. It's because if the softdog
105 * hangs, it might be because of scheduling issues. And
106 * if that is the case, both 'schedule_work' and
107 * 'kernel_restart' may possibly be malfunctional at the
108 * same time.
109 */
110 soft_reboot_fired = true;
111 schedule_work(&reboot_work);
112 hrtimer_add_expires_ns(timer,
113 (u64)TIMER_MARGIN * NSEC_PER_SEC);
114
115 return HRTIMER_RESTART;
116 }
Andrew Morton479d0f42005-07-26 21:41:38 -0700117 emergency_restart();
Joe Perches27c766a2012-02-15 15:06:19 -0800118 pr_crit("Reboot didn't ?????\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100121 return HRTIMER_NORESTART;
122}
Wolfram Sang44ba0f02016-05-25 08:37:46 +0200123
Wolfram Sang2accf322016-10-07 15:41:38 +0300124static struct watchdog_device softdog_dev;
125
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100126static enum hrtimer_restart softdog_pretimeout(struct hrtimer *timer)
Wolfram Sang2accf322016-10-07 15:41:38 +0300127{
128 watchdog_notify_pretimeout(&softdog_dev);
Wolfram Sang2accf322016-10-07 15:41:38 +0300129
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100130 return HRTIMER_NORESTART;
131}
Wolfram Sang2accf322016-10-07 15:41:38 +0300132
Alan Coxa5132ca2012-02-28 22:48:11 +0000133static int softdog_ping(struct watchdog_device *w)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134{
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100135 if (!hrtimer_active(&softdog_ticktock))
Li RongQing5889f062015-12-17 21:30:02 +0800136 __module_get(THIS_MODULE);
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100137 hrtimer_start(&softdog_ticktock, ktime_set(w->timeout, 0),
138 HRTIMER_MODE_REL);
Wolfram Sang2accf322016-10-07 15:41:38 +0300139
Wolfram Sang4cbc6902017-02-07 15:03:29 +0100140 if (IS_ENABLED(CONFIG_SOFT_WATCHDOG_PRETIMEOUT)) {
141 if (w->pretimeout)
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100142 hrtimer_start(&softdog_preticktock,
143 ktime_set(w->timeout - w->pretimeout, 0),
144 HRTIMER_MODE_REL);
Wolfram Sang4cbc6902017-02-07 15:03:29 +0100145 else
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100146 hrtimer_cancel(&softdog_preticktock);
Wolfram Sang4cbc6902017-02-07 15:03:29 +0100147 }
Wolfram Sang2accf322016-10-07 15:41:38 +0300148
Linus Torvalds1da177e2005-04-16 15:20:36 -0700149 return 0;
150}
151
Alan Coxa5132ca2012-02-28 22:48:11 +0000152static int softdog_stop(struct watchdog_device *w)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153{
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100154 if (hrtimer_cancel(&softdog_ticktock))
Li RongQing5889f062015-12-17 21:30:02 +0800155 module_put(THIS_MODULE);
156
Wolfram Sang4cbc6902017-02-07 15:03:29 +0100157 if (IS_ENABLED(CONFIG_SOFT_WATCHDOG_PRETIMEOUT))
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100158 hrtimer_cancel(&softdog_preticktock);
Wolfram Sang2accf322016-10-07 15:41:38 +0300159
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160 return 0;
161}
162
Alan Coxa5132ca2012-02-28 22:48:11 +0000163static struct watchdog_info softdog_info = {
164 .identity = "Software Watchdog",
Wolfram Sang4cbc6902017-02-07 15:03:29 +0100165 .options = WDIOF_SETTIMEOUT | WDIOF_KEEPALIVEPING | WDIOF_MAGICCLOSE,
Alan Coxa5132ca2012-02-28 22:48:11 +0000166};
167
Julia Lawall85f15cf2016-09-01 19:35:26 +0200168static const struct watchdog_ops softdog_ops = {
Alan Coxa5132ca2012-02-28 22:48:11 +0000169 .owner = THIS_MODULE,
170 .start = softdog_ping,
171 .stop = softdog_stop,
Alan Coxa5132ca2012-02-28 22:48:11 +0000172};
173
174static struct watchdog_device softdog_dev = {
175 .info = &softdog_info,
176 .ops = &softdog_ops,
177 .min_timeout = 1,
Wolfram Sange8cf96a2016-05-25 08:37:44 +0200178 .max_timeout = 65535,
179 .timeout = TIMER_MARGIN,
Alan Coxa5132ca2012-02-28 22:48:11 +0000180};
181
Wolfram Sang0efc70b2016-05-25 08:37:45 +0200182static int __init softdog_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183{
184 int ret;
185
Wolfram Sange8cf96a2016-05-25 08:37:44 +0200186 watchdog_init_timeout(&softdog_dev, soft_margin, NULL);
Alan Coxa5132ca2012-02-28 22:48:11 +0000187 watchdog_set_nowayout(&softdog_dev, nowayout);
Damien Riegel84ebcc12015-11-20 16:54:55 -0500188 watchdog_stop_on_reboot(&softdog_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700189
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100190 hrtimer_init(&softdog_ticktock, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
191 softdog_ticktock.function = softdog_fire;
192
193 if (IS_ENABLED(CONFIG_SOFT_WATCHDOG_PRETIMEOUT)) {
Wolfram Sang4cbc6902017-02-07 15:03:29 +0100194 softdog_info.options |= WDIOF_PRETIMEOUT;
Niklas Cassel8d5755b2017-02-27 13:49:09 +0100195 hrtimer_init(&softdog_preticktock, CLOCK_MONOTONIC,
196 HRTIMER_MODE_REL);
197 softdog_preticktock.function = softdog_pretimeout;
198 }
Wolfram Sang4cbc6902017-02-07 15:03:29 +0100199
Woody Lin36a89472020-07-08 16:32:19 +0800200 if (soft_active_on_boot)
201 softdog_ping(&softdog_dev);
202
Alan Coxa5132ca2012-02-28 22:48:11 +0000203 ret = watchdog_register_device(&softdog_dev);
Damien Riegel84ebcc12015-11-20 16:54:55 -0500204 if (ret)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206
Wolfram Sange8cf96a2016-05-25 08:37:44 +0200207 pr_info("initialized. soft_noboot=%d soft_margin=%d sec soft_panic=%d (nowayout=%d)\n",
208 soft_noboot, softdog_dev.timeout, soft_panic, nowayout);
Woody Lin36a89472020-07-08 16:32:19 +0800209 pr_info(" soft_reboot_cmd=%s soft_active_on_boot=%d\n",
210 soft_reboot_cmd ?: "<not set>", soft_active_on_boot);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211
212 return 0;
213}
Wolfram Sang0efc70b2016-05-25 08:37:45 +0200214module_init(softdog_init);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700215
Wolfram Sang0efc70b2016-05-25 08:37:45 +0200216static void __exit softdog_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217{
Alan Coxa5132ca2012-02-28 22:48:11 +0000218 watchdog_unregister_device(&softdog_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219}
Wolfram Sang0efc70b2016-05-25 08:37:45 +0200220module_exit(softdog_exit);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221
222MODULE_AUTHOR("Alan Cox");
223MODULE_DESCRIPTION("Software Watchdog Device Driver");
224MODULE_LICENSE("GPL");