www.infradead.org Git - users/jedix/linux-maple.git/blob

1 /*

2 * linux/kernel/panic.c

3 *

5 */

7 /*

8 * This function is used through-out the kernel (including mm and fs)

9 * to indicate a major problem.

10 */

11 #include <linux/debug_locks.h>

12 #include <linux/interrupt.h>

13 #include <linux/kmsg_dump.h>

14 #include <linux/kallsyms.h>

15 #include <linux/notifier.h>

16 #include <linux/module.h>

17 #include <linux/random.h>

18 #include <linux/ftrace.h>

19 #include <linux/reboot.h>

20 #include <linux/delay.h>

21 #include <linux/kexec.h>

22 #include <linux/sched.h>

23 #include <linux/sysrq.h>

24 #include <linux/init.h>

25 #include <linux/nmi.h>

27 #define PANIC_TIMER_STEP 100

28 #define PANIC_BLINK_SPD 18

30 int panic_on_oops = CONFIG_PANIC_ON_OOPS_VALUE;

31 static unsigned long tainted_mask;

32 static int pause_on_oops;

33 static int pause_on_oops_flag;

34 static DEFINE_SPINLOCK(pause_on_oops_lock);

35 static bool crash_kexec_post_notifiers;

36 int panic_on_warn __read_mostly;

38 int panic_timeout = CONFIG_PANIC_TIMEOUT;

39 EXPORT_SYMBOL_GPL(panic_timeout);

41 ATOMIC_NOTIFIER_HEAD(panic_notifier_list);

43 EXPORT_SYMBOL(panic_notifier_list);

45 static long no_blink(int state)

46 {

47 return 0;

48 }

50 /* Returns how long it waited in ms */

51 long (*panic_blink)(int state);

52 EXPORT_SYMBOL(panic_blink);

54 /*

55 * Stop ourself in panic -- architecture code may override this

56 */

57 void __weak panic_smp_self_stop(void)

58 {

59 while (1)

60 cpu_relax();

61 }

63 atomic_t panic_cpu = ATOMIC_INIT(PANIC_CPU_INVALID);

65 /**

66 * panic - halt the system

67 * @fmt: The text string to print

68 *

69 * Display a message, then perform cleanups.

70 *

71 * This function never returns.

72 */

73 void panic(const char *fmt, ...)

74 {

75 static char buf[1024];

76 va_list args;

77 long i, i_next = 0;

78 int state = 0;

79 int old_cpu, this_cpu;

81 /*

82 * Disable local interrupts. This will prevent panic_smp_self_stop

83 * from deadlocking the first cpu that invokes the panic, since

84 * there is nothing to prevent an interrupt handler (that runs

85 * after setting panic_cpu) from invoking panic() again.

86 */

87 local_irq_disable();

89 /*

90 * It's possible to come here directly from a panic-assertion and

91 * not have preempt disabled. Some functions called from here want

92 * preempt to be disabled. No point enabling it later though...

93 *

94 * Only one CPU is allowed to execute the panic code from here. For

95 * multiple parallel invocations of panic, all other CPUs either

96 * stop themself or will wait until they are stopped by the 1st CPU

97 * with smp_send_stop().

98 *

99 * `old_cpu == PANIC_CPU_INVALID' means this is the 1st CPU which

100 * comes here, so go ahead.

101 * `old_cpu == this_cpu' means we came from nmi_panic() which sets

102 * panic_cpu to this CPU. In this case, this is also the 1st CPU.

103 */

104 this_cpu = raw_smp_processor_id();

105 old_cpu = atomic_cmpxchg(&panic_cpu, PANIC_CPU_INVALID, this_cpu);

106

107 if (old_cpu != PANIC_CPU_INVALID && old_cpu != this_cpu)

108 panic_smp_self_stop();

109

110 console_verbose();

111 bust_spinlocks(1);

112 va_start(args, fmt);

113 vsnprintf(buf, sizeof(buf), fmt, args);

114 va_end(args);

115 pr_emerg("Kernel panic - not syncing: %s\n", buf);

116 #ifdef CONFIG_DEBUG_BUGVERBOSE

117 /*

118 * Avoid nested stack-dumping if a panic occurs during oops processing

119 */

120 if (!test_taint(TAINT_DIE) && oops_in_progress <= 1)

121 dump_stack();

122 #endif

123

124 /*

125 * If we have crashed and we have a crash kernel loaded let it handle

126 * everything else.

127 * If we want to run this after calling panic_notifiers, pass

128 * the "crash_kexec_post_notifiers" option to the kernel.

129 */

130 if (!crash_kexec_post_notifiers)

131 crash_kexec(NULL);

132

133 /*

134 * Note smp_send_stop is the usual smp shutdown function, which

135 * unfortunately means it may not be hardened to work in a panic

136 * situation.

137 */

138 smp_send_stop();

139

140 /*

141 * Run any panic handlers, including those that might need to

142 * add information to the kmsg dump output.

143 */

144 atomic_notifier_call_chain(&panic_notifier_list, 0, buf);

145

146 kmsg_dump(KMSG_DUMP_PANIC);

147

148 /*

149 * If you doubt kdump always works fine in any situation,

150 * "crash_kexec_post_notifiers" offers you a chance to run

151 * panic_notifiers and dumping kmsg before kdump.

152 * Note: since some panic_notifiers can make crashed kernel

153 * more unstable, it can increase risks of the kdump failure too.

154 */

155 crash_kexec(NULL);

156

157 bust_spinlocks(0);

158

159 if (!panic_blink)

160 panic_blink = no_blink;

161

162 if (panic_timeout > 0) {

163 /*

164 * Delay timeout seconds before rebooting the machine.

165 * We can't use the "normal" timers since we just panicked.

166 */

167 pr_emerg("Rebooting in %d seconds..", panic_timeout);

168

169 for (i = 0; i < panic_timeout * 1000; i += PANIC_TIMER_STEP) {

170 touch_nmi_watchdog();

171 if (i >= i_next) {

172 i += panic_blink(state ^= 1);

173 i_next = i + 3600 / PANIC_BLINK_SPD;

174 }

175 mdelay(PANIC_TIMER_STEP);

176 }

177 }

178 if (panic_timeout != 0) {

179 /*

180 * This will not be a clean reboot, with everything

181 * shutting down. But if there is a chance of

182 * rebooting the system it will be rebooted.

183 */

184 emergency_restart();

185 }

186 #ifdef __sparc__

187 {

188 extern int stop_a_enabled;

189 /* Make sure the user can actually press Stop-A (L1-A) */

190 stop_a_enabled = 1;

191 pr_emerg("Press Stop-A (L1-A) to return to the boot prom\n");

192 }

193 #endif

194 #if defined(CONFIG_S390)

195 {

196 unsigned long caller;

197

198 caller = (unsigned long)__builtin_return_address(0);

199 disabled_wait(caller);

200 }

201 #endif

202 pr_emerg("---[ end Kernel panic - not syncing: %s\n", buf);

203 local_irq_enable();

204 for (i = 0; ; i += PANIC_TIMER_STEP) {

205 touch_softlockup_watchdog();

206 if (i >= i_next) {

207 i += panic_blink(state ^= 1);

208 i_next = i + 3600 / PANIC_BLINK_SPD;

209 }

210 mdelay(PANIC_TIMER_STEP);

211 }

212 }

213

214 EXPORT_SYMBOL(panic);

215

216

217 struct tnt {

218 u8 bit;

219 char true;

220 char false;

221 };

222

223 static const struct tnt tnts[] = {

224 { TAINT_PROPRIETARY_MODULE, 'P', 'G' },

225 { TAINT_FORCED_MODULE, 'F', ' ' },

226 { TAINT_CPU_OUT_OF_SPEC, 'S', ' ' },

227 { TAINT_FORCED_RMMOD, 'R', ' ' },

228 { TAINT_MACHINE_CHECK, 'M', ' ' },

229 { TAINT_BAD_PAGE, 'B', ' ' },

230 { TAINT_USER, 'U', ' ' },

231 { TAINT_DIE, 'D', ' ' },

232 { TAINT_OVERRIDDEN_ACPI_TABLE, 'A', ' ' },

233 { TAINT_WARN, 'W', ' ' },

234 { TAINT_CRAP, 'C', ' ' },

235 { TAINT_FIRMWARE_WORKAROUND, 'I', ' ' },

236 { TAINT_OOT_MODULE, 'O', ' ' },

237 { TAINT_UNSIGNED_MODULE, 'E', ' ' },

238 { TAINT_SOFTLOCKUP, 'L', ' ' },

239 { TAINT_LIVEPATCH, 'K', ' ' },

240 };

241

242 /**

243 * print_tainted - return a string to represent the kernel taint state.

244 *

245 * 'P' - Proprietary module has been loaded.

246 * 'F' - Module has been forcibly loaded.

247 * 'S' - SMP with CPUs not designed for SMP.

248 * 'R' - User forced a module unload.

249 * 'M' - System experienced a machine check exception.

250 * 'B' - System has hit bad_page.

251 * 'U' - Userspace-defined naughtiness.

252 * 'D' - Kernel has oopsed before

253 * 'A' - ACPI table overridden.

254 * 'W' - Taint on warning.

255 * 'C' - modules from drivers/staging are loaded.

256 * 'I' - Working around severe firmware bug.

257 * 'O' - Out-of-tree module has been loaded.

258 * 'E' - Unsigned module has been loaded.

259 * 'L' - A soft lockup has previously occurred.

260 * 'K' - Kernel has been live patched.

261 *

262 * The string is overwritten by the next call to print_tainted().

263 */

264 const char *print_tainted(void)

265 {

266 static char buf[ARRAY_SIZE(tnts) + sizeof("Tainted: ")];

267

268 if (tainted_mask) {

269 char *s;

270 int i;

271

272 s = buf + sprintf(buf, "Tainted: ");

273 for (i = 0; i < ARRAY_SIZE(tnts); i++) {

274 const struct tnt *t = &tnts[i];

275 *s++ = test_bit(t->bit, &tainted_mask) ?

276 t->true : t->false;

277 }

278 *s = 0;

279 } else

280 snprintf(buf, sizeof(buf), "Not tainted");

281

282 return buf;

283 }

284

285 int test_taint(unsigned flag)

286 {

287 return test_bit(flag, &tainted_mask);

288 }

289 EXPORT_SYMBOL(test_taint);

290

291 unsigned long get_taint(void)

292 {

293 return tainted_mask;

294 }

295

296 /**

297 * add_taint: add a taint flag if not already set.

298 * @flag: one of the TAINT_* constants.

299 * @lockdep_ok: whether lock debugging is still OK.

300 *

301 * If something bad has gone wrong, you'll want @lockdebug_ok = false, but for

302 * some notewortht-but-not-corrupting cases, it can be set to true.

303 */

304 void add_taint(unsigned flag, enum lockdep_ok lockdep_ok)

305 {

306 if (lockdep_ok == LOCKDEP_NOW_UNRELIABLE && __debug_locks_off())

307 pr_warn("Disabling lock debugging due to kernel taint\n");

308

309 set_bit(flag, &tainted_mask);

310 }

311 EXPORT_SYMBOL(add_taint);

312

313 static void spin_msec(int msecs)

314 {

315 int i;

316

317 for (i = 0; i < msecs; i++) {

318 touch_nmi_watchdog();

319 mdelay(1);

320 }

321 }

322

323 /*

324 * It just happens that oops_enter() and oops_exit() are identically

325 * implemented...

326 */

327 static void do_oops_enter_exit(void)

328 {

329 unsigned long flags;

330 static int spin_counter;

331

332 if (!pause_on_oops)

333 return;

334

335 spin_lock_irqsave(&pause_on_oops_lock, flags);

336 if (pause_on_oops_flag == 0) {

337 /* This CPU may now print the oops message */

338 pause_on_oops_flag = 1;

339 } else {

340 /* We need to stall this CPU */

341 if (!spin_counter) {

342 /* This CPU gets to do the counting */

343 spin_counter = pause_on_oops;

344 do {

345 spin_unlock(&pause_on_oops_lock);

346 spin_msec(MSEC_PER_SEC);

347 spin_lock(&pause_on_oops_lock);

348 } while (--spin_counter);

349 pause_on_oops_flag = 0;

350 } else {

351 /* This CPU waits for a different one */

352 while (spin_counter) {

353 spin_unlock(&pause_on_oops_lock);

354 spin_msec(1);

355 spin_lock(&pause_on_oops_lock);

356 }

357 }

358 }

359 spin_unlock_irqrestore(&pause_on_oops_lock, flags);

360 }

361

362 /*

363 * Return true if the calling CPU is allowed to print oops-related info.

364 * This is a bit racy..

365 */

366 int oops_may_print(void)

367 {

368 return pause_on_oops_flag == 0;

369 }

370

371 /*

372 * Called when the architecture enters its oops handler, before it prints

373 * anything. If this is the first CPU to oops, and it's oopsing the first

374 * time then let it proceed.

375 *

376 * This is all enabled by the pause_on_oops kernel boot option. We do all

377 * this to ensure that oopses don't scroll off the screen. It has the

378 * side-effect of preventing later-oopsing CPUs from mucking up the display,

379 * too.

380 *

381 * It turns out that the CPU which is allowed to print ends up pausing for

382 * the right duration, whereas all the other CPUs pause for twice as long:

383 * once in oops_enter(), once in oops_exit().

384 */

385 void oops_enter(void)

386 {

387 tracing_off();

388 /* can't trust the integrity of the kernel anymore: */

389 debug_locks_off();

390 do_oops_enter_exit();

391 }

392

393 /*

394 * 64-bit random ID for oopses:

395 */

396 static u64 oops_id;

397

398 static int init_oops_id(void)

399 {

400 if (!oops_id)

401 get_random_bytes(&oops_id, sizeof(oops_id));

402 else

403 oops_id++;

404

405 return 0;

406 }

407 late_initcall(init_oops_id);

408

409 void print_oops_end_marker(void)

410 {

411 init_oops_id();

412 pr_warn("---[ end trace %016llx ]---\n", (unsigned long long)oops_id);

413 }

414

415 /*

416 * Called when the architecture exits its oops handler, after printing

417 * everything.

418 */

419 void oops_exit(void)

420 {

421 do_oops_enter_exit();

422 print_oops_end_marker();

423 kmsg_dump(KMSG_DUMP_OOPS);

424 }

425

426 #ifdef WANT_WARN_ON_SLOWPATH

427 struct slowpath_args {

428 const char *fmt;

429 va_list args;

430 };

431

432 static void warn_slowpath_common(const char *file, int line, void *caller,

433 unsigned taint, struct slowpath_args *args)

434 {

435 disable_trace_on_warning();

436

437 pr_warn("------------[ cut here ]------------\n");

438 pr_warn("WARNING: CPU: %d PID: %d at %s:%d %pS()\n",

439 raw_smp_processor_id(), current->pid, file, line, caller);

440

441 if (args)

442 vprintk(args->fmt, args->args);

443

444 if (panic_on_warn) {

445 /*

446 * This thread may hit another WARN() in the panic path.

447 * Resetting this prevents additional WARN() from panicking the

448 * system on this thread. Other threads are blocked by the

449 * panic_mutex in panic().

450 */

451 panic_on_warn = 0;

452 panic("panic_on_warn set ...\n");

453 }

454

455 print_modules();

456 dump_stack();

457 print_oops_end_marker();

458 /* Just a warning, don't kill lockdep. */

459 add_taint(taint, LOCKDEP_STILL_OK);

460 }

461

462 void warn_slowpath_fmt(const char *file, int line, const char *fmt, ...)

463 {

464 struct slowpath_args args;

465

466 args.fmt = fmt;

467 va_start(args.args, fmt);

468 warn_slowpath_common(file, line, __builtin_return_address(0),

469 TAINT_WARN, &args);

470 va_end(args.args);

471 }

472 EXPORT_SYMBOL(warn_slowpath_fmt);

473

474 void warn_slowpath_fmt_taint(const char *file, int line,

475 unsigned taint, const char *fmt, ...)

476 {

477 struct slowpath_args args;

478

479 args.fmt = fmt;

480 va_start(args.args, fmt);

481 warn_slowpath_common(file, line, __builtin_return_address(0),

482 taint, &args);

483 va_end(args.args);

484 }

485 EXPORT_SYMBOL(warn_slowpath_fmt_taint);

486

487 void warn_slowpath_null(const char *file, int line)

488 {

489 warn_slowpath_common(file, line, __builtin_return_address(0),

490 TAINT_WARN, NULL);

491 }

492 EXPORT_SYMBOL(warn_slowpath_null);

493 #endif

494

495 #ifdef CONFIG_CC_STACKPROTECTOR

496

497 /*

498 * Called when gcc's -fstack-protector feature is used, and

499 * gcc detects corruption of the on-stack canary value

500 */

501 __visible void __stack_chk_fail(void)

502 {

503 panic("stack-protector: Kernel stack is corrupted in: %p\n",

504 __builtin_return_address(0));

505 }

506 EXPORT_SYMBOL(__stack_chk_fail);

507

508 #endif

509

510 core_param(panic, panic_timeout, int, 0644);

511 core_param(pause_on_oops, pause_on_oops, int, 0644);

512 core_param(panic_on_warn, panic_on_warn, int, 0644);

513

514 static int __init setup_crash_kexec_post_notifiers(char *s)

515 {

516 crash_kexec_post_notifiers = true;

517 return 0;

518 }

519 early_param("crash_kexec_post_notifiers", setup_crash_kexec_post_notifiers);

520

521 static int __init oops_setup(char *s)

522 {

523 if (!s)

524 return -EINVAL;

525 if (!strcmp(s, "panic"))

526 panic_on_oops = 1;

527 return 0;

528 }

529 early_param("oops", oops_setup);