 72640d8803
			
		
	
	
	72640d8803
	
	
	
		
			
			commit f96972f2dc "kernel/sys.c: call disable_nonboot_cpus() in
kernel_restart()"
added a call to disable_nonboot_cpus() on kernel_restart(), which tries
to shutdown all the CPUs except the first one. The issue with the PA
Semi, is that it does not support CPU hotplug.
When the call is made to __cpu_down(), it calls the notifiers
CPU_DOWN_PREPARE, and then tries to take the CPU down.
One of the notifiers to the CPU hotplug code, is the cpufreq. The
DOWN_PREPARE will call __cpufreq_remove_dev() which calls
cpufreq_driver->exit. The PA Semi exit handler unmaps regions of I/O
that is used by an interrupt that goes off constantly
(system_reset_common, but it goes off during normal system operations
too). I'm not sure exactly what this interrupt does.
Running a simple function trace, you can see it goes off quite a bit:
# tracer: function
#
#           TASK-PID    CPU#    TIMESTAMP  FUNCTION
#              | |       |          |         |
          <idle>-0     [001]  1558.859363: .pasemi_system_reset_exception <-.system_reset_exception
          <idle>-0     [000]  1558.860112: .pasemi_system_reset_exception <-.system_reset_exception
          <idle>-0     [000]  1558.861109: .pasemi_system_reset_exception <-.system_reset_exception
          <idle>-0     [001]  1558.861361: .pasemi_system_reset_exception <-.system_reset_exception
          <idle>-0     [000]  1558.861437: .pasemi_system_reset_exception <-.system_reset_exception
When the region is unmapped, the system crashes with:
Disabling non-boot CPUs ...
Error taking CPU1 down: -38
Unable to handle kernel paging request for data at address 0xd0000800903a0100
Faulting instruction address: 0xc000000000055fcc
Oops: Kernel access of bad area, sig: 11 [#1]
PREEMPT SMP NR_CPUS=64 NUMA PA Semi PWRficient
Modules linked in: shpchp
NIP: c000000000055fcc LR: c000000000055fb4 CTR: c0000000000df1fc
REGS: c0000000012175d0 TRAP: 0300   Not tainted  (3.8.0-rc4-test-dirty)
MSR: 9000000000009032 <SF,HV,EE,ME,IR,DR,RI>  CR: 24000088  XER: 00000000
SOFTE: 0
DAR: d0000800903a0100, DSISR: 42000000
TASK = c0000000010e9008[0] 'swapper/0' THREAD: c000000001214000 CPU: 0
GPR00: d0000800903a0000 c000000001217850 c0000000012167e0 0000000000000000
GPR04: 0000000000000000 0000000000000724 0000000000000724 0000000000000000
GPR08: 0000000000000000 0000000000000000 0000000000000001 0000000000a70000
GPR12: 0000000024000080 c00000000fff0000 ffffffffffffffff 000000003ffffae0
GPR16: ffffffffffffffff 0000000000a21198 0000000000000060 0000000000000000
GPR20: 00000000008fdd35 0000000000a21258 000000003ffffaf0 0000000000000417
GPR24: 0000000000a226d0 c000000000000000 0000000000000000 0000000000000000
GPR28: c00000000138b358 0000000000000000 c000000001144818 d0000800903a0100
NIP [c000000000055fcc] .set_astate+0x5c/0xa4
LR [c000000000055fb4] .set_astate+0x44/0xa4
Call Trace:
[c000000001217850] [c000000000055fb4] .set_astate+0x44/0xa4 (unreliable)
[c0000000012178f0] [c00000000005647c] .restore_astate+0x2c/0x34
[c000000001217980] [c000000000054668] .pasemi_system_reset_exception+0x6c/0x88
[c000000001217a00] [c000000000019ef0] .system_reset_exception+0x48/0x84
[c000000001217a80] [c000000000001e40] system_reset_common+0x140/0x180
Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
		
	
			
		
			
				
	
	
		
			331 lines
		
	
	
	
		
			7.5 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			331 lines
		
	
	
	
		
			7.5 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Copyright (C) 2007 PA Semi, Inc
 | |
|  *
 | |
|  * Authors: Egor Martovetsky <egor@pasemi.com>
 | |
|  *	    Olof Johansson <olof@lixom.net>
 | |
|  *
 | |
|  * Maintained by: Olof Johansson <olof@lixom.net>
 | |
|  *
 | |
|  * Based on arch/powerpc/platforms/cell/cbe_cpufreq.c:
 | |
|  * (C) Copyright IBM Deutschland Entwicklung GmbH 2005
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify
 | |
|  * it under the terms of the GNU General Public License as published by
 | |
|  * the Free Software Foundation; either version 2, or (at your option)
 | |
|  * any later version.
 | |
|  *
 | |
|  * This program is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|  * GNU General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU General Public License
 | |
|  * along with this program; if not, write to the Free Software
 | |
|  * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 | |
|  *
 | |
|  */
 | |
| 
 | |
| #include <linux/cpufreq.h>
 | |
| #include <linux/timer.h>
 | |
| #include <linux/module.h>
 | |
| 
 | |
| #include <asm/hw_irq.h>
 | |
| #include <asm/io.h>
 | |
| #include <asm/prom.h>
 | |
| #include <asm/time.h>
 | |
| #include <asm/smp.h>
 | |
| 
 | |
| #define SDCASR_REG		0x0100
 | |
| #define SDCASR_REG_STRIDE	0x1000
 | |
| #define SDCPWR_CFGA0_REG	0x0100
 | |
| #define SDCPWR_PWST0_REG	0x0000
 | |
| #define SDCPWR_GIZTIME_REG	0x0440
 | |
| 
 | |
| /* SDCPWR_GIZTIME_REG fields */
 | |
| #define SDCPWR_GIZTIME_GR	0x80000000
 | |
| #define SDCPWR_GIZTIME_LONGLOCK	0x000000ff
 | |
| 
 | |
| /* Offset of ASR registers from SDC base */
 | |
| #define SDCASR_OFFSET		0x120000
 | |
| 
 | |
| static void __iomem *sdcpwr_mapbase;
 | |
| static void __iomem *sdcasr_mapbase;
 | |
| 
 | |
| static DEFINE_MUTEX(pas_switch_mutex);
 | |
| 
 | |
| /* Current astate, is used when waking up from power savings on
 | |
|  * one core, in case the other core has switched states during
 | |
|  * the idle time.
 | |
|  */
 | |
| static int current_astate;
 | |
| 
 | |
| /* We support 5(A0-A4) power states excluding turbo(A5-A6) modes */
 | |
| static struct cpufreq_frequency_table pas_freqs[] = {
 | |
| 	{0,	0},
 | |
| 	{1,	0},
 | |
| 	{2,	0},
 | |
| 	{3,	0},
 | |
| 	{4,	0},
 | |
| 	{0,	CPUFREQ_TABLE_END},
 | |
| };
 | |
| 
 | |
| static struct freq_attr *pas_cpu_freqs_attr[] = {
 | |
| 	&cpufreq_freq_attr_scaling_available_freqs,
 | |
| 	NULL,
 | |
| };
 | |
| 
 | |
| /*
 | |
|  * hardware specific functions
 | |
|  */
 | |
| 
 | |
| static int get_astate_freq(int astate)
 | |
| {
 | |
| 	u32 ret;
 | |
| 	ret = in_le32(sdcpwr_mapbase + SDCPWR_CFGA0_REG + (astate * 0x10));
 | |
| 
 | |
| 	return ret & 0x3f;
 | |
| }
 | |
| 
 | |
| static int get_cur_astate(int cpu)
 | |
| {
 | |
| 	u32 ret;
 | |
| 
 | |
| 	ret = in_le32(sdcpwr_mapbase + SDCPWR_PWST0_REG);
 | |
| 	ret = (ret >> (cpu * 4)) & 0x7;
 | |
| 
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static int get_gizmo_latency(void)
 | |
| {
 | |
| 	u32 giztime, ret;
 | |
| 
 | |
| 	giztime = in_le32(sdcpwr_mapbase + SDCPWR_GIZTIME_REG);
 | |
| 
 | |
| 	/* just provide the upper bound */
 | |
| 	if (giztime & SDCPWR_GIZTIME_GR)
 | |
| 		ret = (giztime & SDCPWR_GIZTIME_LONGLOCK) * 128000;
 | |
| 	else
 | |
| 		ret = (giztime & SDCPWR_GIZTIME_LONGLOCK) * 1000;
 | |
| 
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static void set_astate(int cpu, unsigned int astate)
 | |
| {
 | |
| 	unsigned long flags;
 | |
| 
 | |
| 	/* Return if called before init has run */
 | |
| 	if (unlikely(!sdcasr_mapbase))
 | |
| 		return;
 | |
| 
 | |
| 	local_irq_save(flags);
 | |
| 
 | |
| 	out_le32(sdcasr_mapbase + SDCASR_REG + SDCASR_REG_STRIDE*cpu, astate);
 | |
| 
 | |
| 	local_irq_restore(flags);
 | |
| }
 | |
| 
 | |
| int check_astate(void)
 | |
| {
 | |
| 	return get_cur_astate(hard_smp_processor_id());
 | |
| }
 | |
| 
 | |
| void restore_astate(int cpu)
 | |
| {
 | |
| 	set_astate(cpu, current_astate);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * cpufreq functions
 | |
|  */
 | |
| 
 | |
| static int pas_cpufreq_cpu_init(struct cpufreq_policy *policy)
 | |
| {
 | |
| 	const u32 *max_freqp;
 | |
| 	u32 max_freq;
 | |
| 	int i, cur_astate;
 | |
| 	struct resource res;
 | |
| 	struct device_node *cpu, *dn;
 | |
| 	int err = -ENODEV;
 | |
| 
 | |
| 	cpu = of_get_cpu_node(policy->cpu, NULL);
 | |
| 
 | |
| 	if (!cpu)
 | |
| 		goto out;
 | |
| 
 | |
| 	dn = of_find_compatible_node(NULL, NULL, "1682m-sdc");
 | |
| 	if (!dn)
 | |
| 		dn = of_find_compatible_node(NULL, NULL,
 | |
| 					     "pasemi,pwrficient-sdc");
 | |
| 	if (!dn)
 | |
| 		goto out;
 | |
| 	err = of_address_to_resource(dn, 0, &res);
 | |
| 	of_node_put(dn);
 | |
| 	if (err)
 | |
| 		goto out;
 | |
| 	sdcasr_mapbase = ioremap(res.start + SDCASR_OFFSET, 0x2000);
 | |
| 	if (!sdcasr_mapbase) {
 | |
| 		err = -EINVAL;
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	dn = of_find_compatible_node(NULL, NULL, "1682m-gizmo");
 | |
| 	if (!dn)
 | |
| 		dn = of_find_compatible_node(NULL, NULL,
 | |
| 					     "pasemi,pwrficient-gizmo");
 | |
| 	if (!dn) {
 | |
| 		err = -ENODEV;
 | |
| 		goto out_unmap_sdcasr;
 | |
| 	}
 | |
| 	err = of_address_to_resource(dn, 0, &res);
 | |
| 	of_node_put(dn);
 | |
| 	if (err)
 | |
| 		goto out_unmap_sdcasr;
 | |
| 	sdcpwr_mapbase = ioremap(res.start, 0x1000);
 | |
| 	if (!sdcpwr_mapbase) {
 | |
| 		err = -EINVAL;
 | |
| 		goto out_unmap_sdcasr;
 | |
| 	}
 | |
| 
 | |
| 	pr_debug("init cpufreq on CPU %d\n", policy->cpu);
 | |
| 
 | |
| 	max_freqp = of_get_property(cpu, "clock-frequency", NULL);
 | |
| 	if (!max_freqp) {
 | |
| 		err = -EINVAL;
 | |
| 		goto out_unmap_sdcpwr;
 | |
| 	}
 | |
| 
 | |
| 	/* we need the freq in kHz */
 | |
| 	max_freq = *max_freqp / 1000;
 | |
| 
 | |
| 	pr_debug("max clock-frequency is at %u kHz\n", max_freq);
 | |
| 	pr_debug("initializing frequency table\n");
 | |
| 
 | |
| 	/* initialize frequency table */
 | |
| 	for (i=0; pas_freqs[i].frequency!=CPUFREQ_TABLE_END; i++) {
 | |
| 		pas_freqs[i].frequency = get_astate_freq(pas_freqs[i].index) * 100000;
 | |
| 		pr_debug("%d: %d\n", i, pas_freqs[i].frequency);
 | |
| 	}
 | |
| 
 | |
| 	policy->cpuinfo.transition_latency = get_gizmo_latency();
 | |
| 
 | |
| 	cur_astate = get_cur_astate(policy->cpu);
 | |
| 	pr_debug("current astate is at %d\n",cur_astate);
 | |
| 
 | |
| 	policy->cur = pas_freqs[cur_astate].frequency;
 | |
| 	cpumask_copy(policy->cpus, cpu_online_mask);
 | |
| 
 | |
| 	ppc_proc_freq = policy->cur * 1000ul;
 | |
| 
 | |
| 	cpufreq_frequency_table_get_attr(pas_freqs, policy->cpu);
 | |
| 
 | |
| 	/* this ensures that policy->cpuinfo_min and policy->cpuinfo_max
 | |
| 	 * are set correctly
 | |
| 	 */
 | |
| 	return cpufreq_frequency_table_cpuinfo(policy, pas_freqs);
 | |
| 
 | |
| out_unmap_sdcpwr:
 | |
| 	iounmap(sdcpwr_mapbase);
 | |
| 
 | |
| out_unmap_sdcasr:
 | |
| 	iounmap(sdcasr_mapbase);
 | |
| out:
 | |
| 	return err;
 | |
| }
 | |
| 
 | |
| static int pas_cpufreq_cpu_exit(struct cpufreq_policy *policy)
 | |
| {
 | |
| 	/*
 | |
| 	 * We don't support CPU hotplug. Don't unmap after the system
 | |
| 	 * has already made it to a running state.
 | |
| 	 */
 | |
| 	if (system_state != SYSTEM_BOOTING)
 | |
| 		return 0;
 | |
| 
 | |
| 	if (sdcasr_mapbase)
 | |
| 		iounmap(sdcasr_mapbase);
 | |
| 	if (sdcpwr_mapbase)
 | |
| 		iounmap(sdcpwr_mapbase);
 | |
| 
 | |
| 	cpufreq_frequency_table_put_attr(policy->cpu);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int pas_cpufreq_verify(struct cpufreq_policy *policy)
 | |
| {
 | |
| 	return cpufreq_frequency_table_verify(policy, pas_freqs);
 | |
| }
 | |
| 
 | |
| static int pas_cpufreq_target(struct cpufreq_policy *policy,
 | |
| 			      unsigned int target_freq,
 | |
| 			      unsigned int relation)
 | |
| {
 | |
| 	struct cpufreq_freqs freqs;
 | |
| 	int pas_astate_new;
 | |
| 	int i;
 | |
| 
 | |
| 	cpufreq_frequency_table_target(policy,
 | |
| 				       pas_freqs,
 | |
| 				       target_freq,
 | |
| 				       relation,
 | |
| 				       &pas_astate_new);
 | |
| 
 | |
| 	freqs.old = policy->cur;
 | |
| 	freqs.new = pas_freqs[pas_astate_new].frequency;
 | |
| 	freqs.cpu = policy->cpu;
 | |
| 
 | |
| 	mutex_lock(&pas_switch_mutex);
 | |
| 	cpufreq_notify_transition(&freqs, CPUFREQ_PRECHANGE);
 | |
| 
 | |
| 	pr_debug("setting frequency for cpu %d to %d kHz, 1/%d of max frequency\n",
 | |
| 		 policy->cpu,
 | |
| 		 pas_freqs[pas_astate_new].frequency,
 | |
| 		 pas_freqs[pas_astate_new].index);
 | |
| 
 | |
| 	current_astate = pas_astate_new;
 | |
| 
 | |
| 	for_each_online_cpu(i)
 | |
| 		set_astate(i, pas_astate_new);
 | |
| 
 | |
| 	cpufreq_notify_transition(&freqs, CPUFREQ_POSTCHANGE);
 | |
| 	mutex_unlock(&pas_switch_mutex);
 | |
| 
 | |
| 	ppc_proc_freq = freqs.new * 1000ul;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static struct cpufreq_driver pas_cpufreq_driver = {
 | |
| 	.name		= "pas-cpufreq",
 | |
| 	.owner		= THIS_MODULE,
 | |
| 	.flags		= CPUFREQ_CONST_LOOPS,
 | |
| 	.init		= pas_cpufreq_cpu_init,
 | |
| 	.exit		= pas_cpufreq_cpu_exit,
 | |
| 	.verify		= pas_cpufreq_verify,
 | |
| 	.target		= pas_cpufreq_target,
 | |
| 	.attr		= pas_cpu_freqs_attr,
 | |
| };
 | |
| 
 | |
| /*
 | |
|  * module init and destoy
 | |
|  */
 | |
| 
 | |
| static int __init pas_cpufreq_init(void)
 | |
| {
 | |
| 	if (!of_machine_is_compatible("PA6T-1682M") &&
 | |
| 	    !of_machine_is_compatible("pasemi,pwrficient"))
 | |
| 		return -ENODEV;
 | |
| 
 | |
| 	return cpufreq_register_driver(&pas_cpufreq_driver);
 | |
| }
 | |
| 
 | |
| static void __exit pas_cpufreq_exit(void)
 | |
| {
 | |
| 	cpufreq_unregister_driver(&pas_cpufreq_driver);
 | |
| }
 | |
| 
 | |
| module_init(pas_cpufreq_init);
 | |
| module_exit(pas_cpufreq_exit);
 | |
| 
 | |
| MODULE_LICENSE("GPL");
 | |
| MODULE_AUTHOR("Egor Martovetsky <egor@pasemi.com>, Olof Johansson <olof@lixom.net>");
 |