 b5aff55d89
			
		
	
	
	b5aff55d89
	
	
	
		
			
			The M7 processor has a different hypervisor group id and different PCR fast trap values. PIC read/write functions and PCR bit fields are the same as the T4 so those are reused. Signed-off-by: David Ahern <david.ahern@oracle.com> Acked-by: Bob Picco <bob.picco@oracle.com> Signed-off-by: David S. Miller <davem@davemloft.net>
		
			
				
	
	
		
			372 lines
		
	
	
	
		
			7.8 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			372 lines
		
	
	
	
		
			7.8 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
| /* pcr.c: Generic sparc64 performance counter infrastructure.
 | |
|  *
 | |
|  * Copyright (C) 2009 David S. Miller (davem@davemloft.net)
 | |
|  */
 | |
| #include <linux/kernel.h>
 | |
| #include <linux/export.h>
 | |
| #include <linux/init.h>
 | |
| #include <linux/irq.h>
 | |
| 
 | |
| #include <linux/irq_work.h>
 | |
| #include <linux/ftrace.h>
 | |
| 
 | |
| #include <asm/pil.h>
 | |
| #include <asm/pcr.h>
 | |
| #include <asm/nmi.h>
 | |
| #include <asm/asi.h>
 | |
| #include <asm/spitfire.h>
 | |
| 
 | |
| /* This code is shared between various users of the performance
 | |
|  * counters.  Users will be oprofile, pseudo-NMI watchdog, and the
 | |
|  * perf_event support layer.
 | |
|  */
 | |
| 
 | |
| /* Performance counter interrupts run unmasked at PIL level 15.
 | |
|  * Therefore we can't do things like wakeups and other work
 | |
|  * that expects IRQ disabling to be adhered to in locking etc.
 | |
|  *
 | |
|  * Therefore in such situations we defer the work by signalling
 | |
|  * a lower level cpu IRQ.
 | |
|  */
 | |
| void __irq_entry deferred_pcr_work_irq(int irq, struct pt_regs *regs)
 | |
| {
 | |
| 	struct pt_regs *old_regs;
 | |
| 
 | |
| 	clear_softint(1 << PIL_DEFERRED_PCR_WORK);
 | |
| 
 | |
| 	old_regs = set_irq_regs(regs);
 | |
| 	irq_enter();
 | |
| #ifdef CONFIG_IRQ_WORK
 | |
| 	irq_work_run();
 | |
| #endif
 | |
| 	irq_exit();
 | |
| 	set_irq_regs(old_regs);
 | |
| }
 | |
| 
 | |
| void arch_irq_work_raise(void)
 | |
| {
 | |
| 	set_softint(1 << PIL_DEFERRED_PCR_WORK);
 | |
| }
 | |
| 
 | |
| const struct pcr_ops *pcr_ops;
 | |
| EXPORT_SYMBOL_GPL(pcr_ops);
 | |
| 
 | |
| static u64 direct_pcr_read(unsigned long reg_num)
 | |
| {
 | |
| 	u64 val;
 | |
| 
 | |
| 	WARN_ON_ONCE(reg_num != 0);
 | |
| 	__asm__ __volatile__("rd %%pcr, %0" : "=r" (val));
 | |
| 	return val;
 | |
| }
 | |
| 
 | |
| static void direct_pcr_write(unsigned long reg_num, u64 val)
 | |
| {
 | |
| 	WARN_ON_ONCE(reg_num != 0);
 | |
| 	__asm__ __volatile__("wr %0, 0x0, %%pcr" : : "r" (val));
 | |
| }
 | |
| 
 | |
| static u64 direct_pic_read(unsigned long reg_num)
 | |
| {
 | |
| 	u64 val;
 | |
| 
 | |
| 	WARN_ON_ONCE(reg_num != 0);
 | |
| 	__asm__ __volatile__("rd %%pic, %0" : "=r" (val));
 | |
| 	return val;
 | |
| }
 | |
| 
 | |
| static void direct_pic_write(unsigned long reg_num, u64 val)
 | |
| {
 | |
| 	WARN_ON_ONCE(reg_num != 0);
 | |
| 
 | |
| 	/* Blackbird errata workaround.  See commentary in
 | |
| 	 * arch/sparc64/kernel/smp.c:smp_percpu_timer_interrupt()
 | |
| 	 * for more information.
 | |
| 	 */
 | |
| 	__asm__ __volatile__("ba,pt	%%xcc, 99f\n\t"
 | |
| 			     " nop\n\t"
 | |
| 			     ".align	64\n"
 | |
| 			  "99:wr	%0, 0x0, %%pic\n\t"
 | |
| 			     "rd	%%pic, %%g0" : : "r" (val));
 | |
| }
 | |
| 
 | |
| static u64 direct_picl_value(unsigned int nmi_hz)
 | |
| {
 | |
| 	u32 delta = local_cpu_data().clock_tick / nmi_hz;
 | |
| 
 | |
| 	return ((u64)((0 - delta) & 0xffffffff)) << 32;
 | |
| }
 | |
| 
 | |
| static const struct pcr_ops direct_pcr_ops = {
 | |
| 	.read_pcr		= direct_pcr_read,
 | |
| 	.write_pcr		= direct_pcr_write,
 | |
| 	.read_pic		= direct_pic_read,
 | |
| 	.write_pic		= direct_pic_write,
 | |
| 	.nmi_picl_value		= direct_picl_value,
 | |
| 	.pcr_nmi_enable		= (PCR_PIC_PRIV | PCR_STRACE | PCR_UTRACE),
 | |
| 	.pcr_nmi_disable	= PCR_PIC_PRIV,
 | |
| };
 | |
| 
 | |
| static void n2_pcr_write(unsigned long reg_num, u64 val)
 | |
| {
 | |
| 	unsigned long ret;
 | |
| 
 | |
| 	WARN_ON_ONCE(reg_num != 0);
 | |
| 	if (val & PCR_N2_HTRACE) {
 | |
| 		ret = sun4v_niagara2_setperf(HV_N2_PERF_SPARC_CTL, val);
 | |
| 		if (ret != HV_EOK)
 | |
| 			direct_pcr_write(reg_num, val);
 | |
| 	} else
 | |
| 		direct_pcr_write(reg_num, val);
 | |
| }
 | |
| 
 | |
| static u64 n2_picl_value(unsigned int nmi_hz)
 | |
| {
 | |
| 	u32 delta = local_cpu_data().clock_tick / (nmi_hz << 2);
 | |
| 
 | |
| 	return ((u64)((0 - delta) & 0xffffffff)) << 32;
 | |
| }
 | |
| 
 | |
| static const struct pcr_ops n2_pcr_ops = {
 | |
| 	.read_pcr		= direct_pcr_read,
 | |
| 	.write_pcr		= n2_pcr_write,
 | |
| 	.read_pic		= direct_pic_read,
 | |
| 	.write_pic		= direct_pic_write,
 | |
| 	.nmi_picl_value		= n2_picl_value,
 | |
| 	.pcr_nmi_enable		= (PCR_PIC_PRIV | PCR_STRACE | PCR_UTRACE |
 | |
| 				   PCR_N2_TOE_OV1 |
 | |
| 				   (2 << PCR_N2_SL1_SHIFT) |
 | |
| 				   (0xff << PCR_N2_MASK1_SHIFT)),
 | |
| 	.pcr_nmi_disable	= PCR_PIC_PRIV,
 | |
| };
 | |
| 
 | |
| static u64 n4_pcr_read(unsigned long reg_num)
 | |
| {
 | |
| 	unsigned long val;
 | |
| 
 | |
| 	(void) sun4v_vt_get_perfreg(reg_num, &val);
 | |
| 
 | |
| 	return val;
 | |
| }
 | |
| 
 | |
| static void n4_pcr_write(unsigned long reg_num, u64 val)
 | |
| {
 | |
| 	(void) sun4v_vt_set_perfreg(reg_num, val);
 | |
| }
 | |
| 
 | |
| static u64 n4_pic_read(unsigned long reg_num)
 | |
| {
 | |
| 	unsigned long val;
 | |
| 
 | |
| 	__asm__ __volatile__("ldxa [%1] %2, %0"
 | |
| 			     : "=r" (val)
 | |
| 			     : "r" (reg_num * 0x8UL), "i" (ASI_PIC));
 | |
| 
 | |
| 	return val;
 | |
| }
 | |
| 
 | |
| static void n4_pic_write(unsigned long reg_num, u64 val)
 | |
| {
 | |
| 	__asm__ __volatile__("stxa %0, [%1] %2"
 | |
| 			     : /* no outputs */
 | |
| 			     : "r" (val), "r" (reg_num * 0x8UL), "i" (ASI_PIC));
 | |
| }
 | |
| 
 | |
| static u64 n4_picl_value(unsigned int nmi_hz)
 | |
| {
 | |
| 	u32 delta = local_cpu_data().clock_tick / (nmi_hz << 2);
 | |
| 
 | |
| 	return ((u64)((0 - delta) & 0xffffffff));
 | |
| }
 | |
| 
 | |
| static const struct pcr_ops n4_pcr_ops = {
 | |
| 	.read_pcr		= n4_pcr_read,
 | |
| 	.write_pcr		= n4_pcr_write,
 | |
| 	.read_pic		= n4_pic_read,
 | |
| 	.write_pic		= n4_pic_write,
 | |
| 	.nmi_picl_value		= n4_picl_value,
 | |
| 	.pcr_nmi_enable		= (PCR_N4_PICNPT | PCR_N4_STRACE |
 | |
| 				   PCR_N4_UTRACE | PCR_N4_TOE |
 | |
| 				   (26 << PCR_N4_SL_SHIFT)),
 | |
| 	.pcr_nmi_disable	= PCR_N4_PICNPT,
 | |
| };
 | |
| 
 | |
| static u64 n5_pcr_read(unsigned long reg_num)
 | |
| {
 | |
| 	unsigned long val;
 | |
| 
 | |
| 	(void) sun4v_t5_get_perfreg(reg_num, &val);
 | |
| 
 | |
| 	return val;
 | |
| }
 | |
| 
 | |
| static void n5_pcr_write(unsigned long reg_num, u64 val)
 | |
| {
 | |
| 	(void) sun4v_t5_set_perfreg(reg_num, val);
 | |
| }
 | |
| 
 | |
| static const struct pcr_ops n5_pcr_ops = {
 | |
| 	.read_pcr		= n5_pcr_read,
 | |
| 	.write_pcr		= n5_pcr_write,
 | |
| 	.read_pic		= n4_pic_read,
 | |
| 	.write_pic		= n4_pic_write,
 | |
| 	.nmi_picl_value		= n4_picl_value,
 | |
| 	.pcr_nmi_enable		= (PCR_N4_PICNPT | PCR_N4_STRACE |
 | |
| 				   PCR_N4_UTRACE | PCR_N4_TOE |
 | |
| 				   (26 << PCR_N4_SL_SHIFT)),
 | |
| 	.pcr_nmi_disable	= PCR_N4_PICNPT,
 | |
| };
 | |
| 
 | |
| static u64 m7_pcr_read(unsigned long reg_num)
 | |
| {
 | |
| 	unsigned long val;
 | |
| 
 | |
| 	(void) sun4v_m7_get_perfreg(reg_num, &val);
 | |
| 
 | |
| 	return val;
 | |
| }
 | |
| 
 | |
| static void m7_pcr_write(unsigned long reg_num, u64 val)
 | |
| {
 | |
| 	(void) sun4v_m7_set_perfreg(reg_num, val);
 | |
| }
 | |
| 
 | |
| static const struct pcr_ops m7_pcr_ops = {
 | |
| 	.read_pcr		= m7_pcr_read,
 | |
| 	.write_pcr		= m7_pcr_write,
 | |
| 	.read_pic		= n4_pic_read,
 | |
| 	.write_pic		= n4_pic_write,
 | |
| 	.nmi_picl_value		= n4_picl_value,
 | |
| 	.pcr_nmi_enable		= (PCR_N4_PICNPT | PCR_N4_STRACE |
 | |
| 				   PCR_N4_UTRACE | PCR_N4_TOE |
 | |
| 				   (26 << PCR_N4_SL_SHIFT)),
 | |
| 	.pcr_nmi_disable	= PCR_N4_PICNPT,
 | |
| };
 | |
| 
 | |
| static unsigned long perf_hsvc_group;
 | |
| static unsigned long perf_hsvc_major;
 | |
| static unsigned long perf_hsvc_minor;
 | |
| 
 | |
| static int __init register_perf_hsvc(void)
 | |
| {
 | |
| 	unsigned long hverror;
 | |
| 
 | |
| 	if (tlb_type == hypervisor) {
 | |
| 		switch (sun4v_chip_type) {
 | |
| 		case SUN4V_CHIP_NIAGARA1:
 | |
| 			perf_hsvc_group = HV_GRP_NIAG_PERF;
 | |
| 			break;
 | |
| 
 | |
| 		case SUN4V_CHIP_NIAGARA2:
 | |
| 			perf_hsvc_group = HV_GRP_N2_CPU;
 | |
| 			break;
 | |
| 
 | |
| 		case SUN4V_CHIP_NIAGARA3:
 | |
| 			perf_hsvc_group = HV_GRP_KT_CPU;
 | |
| 			break;
 | |
| 
 | |
| 		case SUN4V_CHIP_NIAGARA4:
 | |
| 			perf_hsvc_group = HV_GRP_VT_CPU;
 | |
| 			break;
 | |
| 
 | |
| 		case SUN4V_CHIP_NIAGARA5:
 | |
| 			perf_hsvc_group = HV_GRP_T5_CPU;
 | |
| 			break;
 | |
| 
 | |
| 		case SUN4V_CHIP_SPARC_M7:
 | |
| 			perf_hsvc_group = HV_GRP_M7_PERF;
 | |
| 			break;
 | |
| 
 | |
| 		default:
 | |
| 			return -ENODEV;
 | |
| 		}
 | |
| 
 | |
| 
 | |
| 		perf_hsvc_major = 1;
 | |
| 		perf_hsvc_minor = 0;
 | |
| 		hverror = sun4v_hvapi_register(perf_hsvc_group,
 | |
| 					       perf_hsvc_major,
 | |
| 					       &perf_hsvc_minor);
 | |
| 		if (hverror) {
 | |
| 			pr_err("perfmon: Could not register hvapi(0x%lx).\n",
 | |
| 			       hverror);
 | |
| 			return -ENODEV;
 | |
| 		}
 | |
| 	}
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static void __init unregister_perf_hsvc(void)
 | |
| {
 | |
| 	if (tlb_type != hypervisor)
 | |
| 		return;
 | |
| 	sun4v_hvapi_unregister(perf_hsvc_group);
 | |
| }
 | |
| 
 | |
| static int __init setup_sun4v_pcr_ops(void)
 | |
| {
 | |
| 	int ret = 0;
 | |
| 
 | |
| 	switch (sun4v_chip_type) {
 | |
| 	case SUN4V_CHIP_NIAGARA1:
 | |
| 	case SUN4V_CHIP_NIAGARA2:
 | |
| 	case SUN4V_CHIP_NIAGARA3:
 | |
| 		pcr_ops = &n2_pcr_ops;
 | |
| 		break;
 | |
| 
 | |
| 	case SUN4V_CHIP_NIAGARA4:
 | |
| 		pcr_ops = &n4_pcr_ops;
 | |
| 		break;
 | |
| 
 | |
| 	case SUN4V_CHIP_NIAGARA5:
 | |
| 		pcr_ops = &n5_pcr_ops;
 | |
| 		break;
 | |
| 
 | |
| 	case SUN4V_CHIP_SPARC_M7:
 | |
| 		pcr_ops = &m7_pcr_ops;
 | |
| 		break;
 | |
| 
 | |
| 	default:
 | |
| 		ret = -ENODEV;
 | |
| 		break;
 | |
| 	}
 | |
| 
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| int __init pcr_arch_init(void)
 | |
| {
 | |
| 	int err = register_perf_hsvc();
 | |
| 
 | |
| 	if (err)
 | |
| 		return err;
 | |
| 
 | |
| 	switch (tlb_type) {
 | |
| 	case hypervisor:
 | |
| 		err = setup_sun4v_pcr_ops();
 | |
| 		if (err)
 | |
| 			goto out_unregister;
 | |
| 		break;
 | |
| 
 | |
| 	case cheetah:
 | |
| 	case cheetah_plus:
 | |
| 		pcr_ops = &direct_pcr_ops;
 | |
| 		break;
 | |
| 
 | |
| 	case spitfire:
 | |
| 		/* UltraSPARC-I/II and derivatives lack a profile
 | |
| 		 * counter overflow interrupt so we can't make use of
 | |
| 		 * their hardware currently.
 | |
| 		 */
 | |
| 		/* fallthrough */
 | |
| 	default:
 | |
| 		err = -ENODEV;
 | |
| 		goto out_unregister;
 | |
| 	}
 | |
| 
 | |
| 	return nmi_init();
 | |
| 
 | |
| out_unregister:
 | |
| 	unregister_perf_hsvc();
 | |
| 	return err;
 | |
| }
 |