| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | /*
 | 
					
						
							|  |  |  |  * Persistent Storage - pstore.h | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Copyright (C) 2010 Intel Corporation <tony.luck@intel.com> | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * This code is the generic layer to export data records from platform | 
					
						
							|  |  |  |  * level persistent storage via a file system. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  *  This program is free software; you can redistribute it and/or modify | 
					
						
							|  |  |  |  *  it under the terms of the GNU General Public License version 2 as | 
					
						
							|  |  |  |  *  published by the Free Software Foundation. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  *  This program is distributed in the hope that it will be useful, | 
					
						
							|  |  |  |  *  but WITHOUT ANY WARRANTY; without even the implied warranty of | 
					
						
							|  |  |  |  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
					
						
							|  |  |  |  *  GNU General Public License for more details. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  *  You should have received a copy of the GNU General Public License | 
					
						
							|  |  |  |  *  along with this program; if not, write to the Free Software | 
					
						
							|  |  |  |  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | #ifndef _LINUX_PSTORE_H
 | 
					
						
							|  |  |  | #define _LINUX_PSTORE_H
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-11-17 13:13:29 -08:00
										 |  |  | #include <linux/time.h>
 | 
					
						
							|  |  |  | #include <linux/kmsg_dump.h>
 | 
					
						
							| 
									
										
										
										
											2012-07-17 11:37:07 -07:00
										 |  |  | #include <linux/mutex.h>
 | 
					
						
							|  |  |  | #include <linux/types.h>
 | 
					
						
							|  |  |  | #include <linux/spinlock.h>
 | 
					
						
							|  |  |  | #include <linux/errno.h>
 | 
					
						
							| 
									
										
										
										
											2011-11-17 13:13:29 -08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | /* types */ | 
					
						
							|  |  |  | enum pstore_type_id { | 
					
						
							|  |  |  | 	PSTORE_TYPE_DMESG	= 0, | 
					
						
							|  |  |  | 	PSTORE_TYPE_MCE		= 1, | 
					
						
							| 
									
										
										
										
											2012-05-26 06:20:19 -07:00
										 |  |  | 	PSTORE_TYPE_CONSOLE	= 2, | 
					
						
							| 
									
										
										
										
											2012-07-09 17:10:41 -07:00
										 |  |  | 	PSTORE_TYPE_FTRACE	= 3, | 
					
						
							| 
									
										
										
										
											2013-06-06 00:21:44 +05:30
										 |  |  | 	/* PPC64 partition types */ | 
					
						
							|  |  |  | 	PSTORE_TYPE_PPC_RTAS	= 4, | 
					
						
							| 
									
										
										
										
											2013-06-06 00:22:10 +05:30
										 |  |  | 	PSTORE_TYPE_PPC_OF	= 5, | 
					
						
							| 
									
										
										
										
											2013-06-06 00:22:20 +05:30
										 |  |  | 	PSTORE_TYPE_PPC_COMMON	= 6, | 
					
						
							| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | 	PSTORE_TYPE_UNKNOWN	= 255 | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-07-17 11:37:07 -07:00
										 |  |  | struct module; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | struct pstore_info { | 
					
						
							|  |  |  | 	struct module	*owner; | 
					
						
							|  |  |  | 	char		*name; | 
					
						
							| 
									
										
										
										
											2011-08-12 10:54:51 -07:00
										 |  |  | 	spinlock_t	buf_lock;	/* serialize access to 'buf' */ | 
					
						
							| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | 	char		*buf; | 
					
						
							|  |  |  | 	size_t		bufsize; | 
					
						
							| 
									
										
										
										
											2011-11-17 12:58:07 -08:00
										 |  |  | 	struct mutex	read_mutex;	/* serialize open/read/close */ | 
					
						
							| 
									
										
										
										
											2011-05-16 11:00:27 -07:00
										 |  |  | 	int		(*open)(struct pstore_info *psi); | 
					
						
							|  |  |  | 	int		(*close)(struct pstore_info *psi); | 
					
						
							| 
									
										
										
										
											2011-05-16 10:58:57 -07:00
										 |  |  | 	ssize_t		(*read)(u64 *id, enum pstore_type_id *type, | 
					
						
							| 
									
										
											  
											
												efi_pstore: Add a sequence counter to a variable name
[Issue]
Currently, a variable name, which identifies each entry, consists of type, id and ctime.
But if multiple events happens in a short time, a second/third event may fail to log because
efi_pstore can't distinguish each event with current variable name.
[Solution]
A reasonable way to identify all events precisely is introducing a sequence counter to
the variable name.
The sequence counter has already supported in a pstore layer with "oopscount".
So, this patch adds it to a variable name.
Also, it is passed to read/erase callbacks of platform drivers in accordance with
the modification of the variable name.
  <before applying this patch>
 a variable name of first event: dump-type0-1-12345678
 a variable name of second event: dump-type0-1-12345678
  type:0
  id:1
  ctime:12345678
 If multiple events happen in a short time, efi_pstore can't distinguish them because
 variable names are same among them.
  <after applying this patch>
 it can be distinguishable by adding a sequence counter as follows.
 a variable name of first event: dump-type0-1-1-12345678
 a variable name of Second event: dump-type0-1-2-12345678
  type:0
  id:1
  sequence counter: 1(first event), 2(second event)
  ctime:12345678
In case of a write callback executed in pstore_console_write(), "0" is added to
an argument of the write callback because it just logs all kernel messages and
doesn't need to care about multiple events.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Acked-by: Rafael J. Wysocki <rafael.j.wysocki@intel.com>
Acked-by: Mike Waychison <mikew@google.com>
Signed-off-by: Tony Luck <tony.luck@intel.com>
											
										 
											2012-11-26 16:07:44 -08:00
										 |  |  | 			int *count, struct timespec *time, char **buf, | 
					
						
							| 
									
										
										
										
											2013-08-16 13:53:19 -07:00
										 |  |  | 			bool *compressed, struct pstore_info *psi); | 
					
						
							| 
									
										
										
										
											2011-11-17 13:13:29 -08:00
										 |  |  | 	int		(*write)(enum pstore_type_id type, | 
					
						
							|  |  |  | 			enum kmsg_dump_reason reason, u64 *id, | 
					
						
							| 
									
										
										
										
											2013-08-16 13:52:47 -07:00
										 |  |  | 			unsigned int part, int count, bool compressed, | 
					
						
							| 
									
										
										
										
											2013-06-27 14:02:56 +05:30
										 |  |  | 			size_t size, struct pstore_info *psi); | 
					
						
							| 
									
										
										
										
											2012-07-09 17:10:40 -07:00
										 |  |  | 	int		(*write_buf)(enum pstore_type_id type, | 
					
						
							|  |  |  | 			enum kmsg_dump_reason reason, u64 *id, | 
					
						
							| 
									
										
										
										
											2013-08-16 13:52:47 -07:00
										 |  |  | 			unsigned int part, const char *buf, bool compressed, | 
					
						
							| 
									
										
										
										
											2013-06-27 14:02:56 +05:30
										 |  |  | 			size_t size, struct pstore_info *psi); | 
					
						
							| 
									
										
										
										
											2011-07-21 16:57:53 -04:00
										 |  |  | 	int		(*erase)(enum pstore_type_id type, u64 id, | 
					
						
							| 
									
										
											  
											
												efi_pstore: Add a sequence counter to a variable name
[Issue]
Currently, a variable name, which identifies each entry, consists of type, id and ctime.
But if multiple events happens in a short time, a second/third event may fail to log because
efi_pstore can't distinguish each event with current variable name.
[Solution]
A reasonable way to identify all events precisely is introducing a sequence counter to
the variable name.
The sequence counter has already supported in a pstore layer with "oopscount".
So, this patch adds it to a variable name.
Also, it is passed to read/erase callbacks of platform drivers in accordance with
the modification of the variable name.
  <before applying this patch>
 a variable name of first event: dump-type0-1-12345678
 a variable name of second event: dump-type0-1-12345678
  type:0
  id:1
  ctime:12345678
 If multiple events happen in a short time, efi_pstore can't distinguish them because
 variable names are same among them.
  <after applying this patch>
 it can be distinguishable by adding a sequence counter as follows.
 a variable name of first event: dump-type0-1-1-12345678
 a variable name of Second event: dump-type0-1-2-12345678
  type:0
  id:1
  sequence counter: 1(first event), 2(second event)
  ctime:12345678
In case of a write callback executed in pstore_console_write(), "0" is added to
an argument of the write callback because it just logs all kernel messages and
doesn't need to care about multiple events.
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Acked-by: Rafael J. Wysocki <rafael.j.wysocki@intel.com>
Acked-by: Mike Waychison <mikew@google.com>
Signed-off-by: Tony Luck <tony.luck@intel.com>
											
										 
											2012-11-26 16:07:44 -08:00
										 |  |  | 			int count, struct timespec time, | 
					
						
							|  |  |  | 			struct pstore_info *psi); | 
					
						
							| 
									
										
										
										
											2011-07-21 16:57:52 -04:00
										 |  |  | 	void		*data; | 
					
						
							| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef CONFIG_PSTORE
 | 
					
						
							|  |  |  | extern int pstore_register(struct pstore_info *); | 
					
						
							| 
									
										
											  
											
												pstore: Avoid deadlock in panic and emergency-restart path
[Issue]
When pstore is in panic and emergency-restart paths, it may be blocked
in those paths because it simply takes spin_lock.
This is an example scenario which pstore may hang up in a panic path:
 - cpuA grabs psinfo->buf_lock
 - cpuB panics and calls smp_send_stop
 - smp_send_stop sends IRQ to cpuA
 - after 1 second, cpuB gives up on cpuA and sends an NMI instead
 - cpuA is now in an NMI handler while still holding buf_lock
 - cpuB is deadlocked
This case may happen if a firmware has a bug and
cpuA is stuck talking with it more than one second.
Also, this is a similar scenario in an emergency-restart path:
 - cpuA grabs psinfo->buf_lock and stucks in a firmware
 - cpuB kicks emergency-restart via either sysrq-b or hangcheck timer.
   And then, cpuB is deadlocked by taking psinfo->buf_lock again.
[Solution]
This patch avoids the deadlocking issues in both panic and emergency_restart
paths by introducing a function, is_non_blocking_path(), to check if a cpu
can be blocked in current path.
With this patch, pstore is not blocked even if another cpu has
taken a spin_lock, in those paths by changing from spin_lock_irqsave
to spin_trylock_irqsave.
In addition, according to a comment of emergency_restart() in kernel/sys.c,
spin_lock shouldn't be taken in an emergency_restart path to avoid
deadlock. This patch fits the comment below.
<snip>
/**
 *      emergency_restart - reboot the system
 *
 *      Without shutting down any hardware or taking any locks
 *      reboot the system.  This is called when we know we are in
 *      trouble so this is our best effort to reboot.  This is
 *      safe to call in interrupt context.
 */
void emergency_restart(void)
<snip>
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Acked-by: Don Zickus <dzickus@redhat.com>
Signed-off-by: Tony Luck <tony.luck@intel.com>
											
										 
											2013-01-11 18:09:41 +00:00
										 |  |  | extern bool pstore_cannot_block_path(enum kmsg_dump_reason reason); | 
					
						
							| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | #else
 | 
					
						
							|  |  |  | static inline int | 
					
						
							|  |  |  | pstore_register(struct pstore_info *psi) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return -ENODEV; | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
											  
											
												pstore: Avoid deadlock in panic and emergency-restart path
[Issue]
When pstore is in panic and emergency-restart paths, it may be blocked
in those paths because it simply takes spin_lock.
This is an example scenario which pstore may hang up in a panic path:
 - cpuA grabs psinfo->buf_lock
 - cpuB panics and calls smp_send_stop
 - smp_send_stop sends IRQ to cpuA
 - after 1 second, cpuB gives up on cpuA and sends an NMI instead
 - cpuA is now in an NMI handler while still holding buf_lock
 - cpuB is deadlocked
This case may happen if a firmware has a bug and
cpuA is stuck talking with it more than one second.
Also, this is a similar scenario in an emergency-restart path:
 - cpuA grabs psinfo->buf_lock and stucks in a firmware
 - cpuB kicks emergency-restart via either sysrq-b or hangcheck timer.
   And then, cpuB is deadlocked by taking psinfo->buf_lock again.
[Solution]
This patch avoids the deadlocking issues in both panic and emergency_restart
paths by introducing a function, is_non_blocking_path(), to check if a cpu
can be blocked in current path.
With this patch, pstore is not blocked even if another cpu has
taken a spin_lock, in those paths by changing from spin_lock_irqsave
to spin_trylock_irqsave.
In addition, according to a comment of emergency_restart() in kernel/sys.c,
spin_lock shouldn't be taken in an emergency_restart path to avoid
deadlock. This patch fits the comment below.
<snip>
/**
 *      emergency_restart - reboot the system
 *
 *      Without shutting down any hardware or taking any locks
 *      reboot the system.  This is called when we know we are in
 *      trouble so this is our best effort to reboot.  This is
 *      safe to call in interrupt context.
 */
void emergency_restart(void)
<snip>
Signed-off-by: Seiji Aguchi <seiji.aguchi@hds.com>
Acked-by: Don Zickus <dzickus@redhat.com>
Signed-off-by: Tony Luck <tony.luck@intel.com>
											
										 
											2013-01-11 18:09:41 +00:00
										 |  |  | static inline bool | 
					
						
							|  |  |  | pstore_cannot_block_path(enum kmsg_dump_reason reason) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return false; | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2010-12-28 14:25:21 -08:00
										 |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif /*_LINUX_PSTORE_H*/
 |