 a086536858
			
		
	
	
	a086536858
	
	
	
		
			
			A strange variation was seen in the BogoMIPS figure for the ST40-300. This was eventually tracked down to sensitivity to the alignment of the loop. So add an align directive to ensure this doesn't occur. Signed-off-by: Stuart Menefy <stuart.menefy@st.com> Signed-off-by: Paul Mundt <lethal@linux-sh.org>
		
			
				
	
	
		
			53 lines
		
	
	
	
		
			1 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			53 lines
		
	
	
	
		
			1 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  *	Precise Delay Loops for SuperH
 | |
|  *
 | |
|  *	Copyright (C) 1999 Niibe Yutaka & Kaz Kojima
 | |
|  */
 | |
| 
 | |
| #include <linux/sched.h>
 | |
| #include <linux/delay.h>
 | |
| 
 | |
| void __delay(unsigned long loops)
 | |
| {
 | |
| 	__asm__ __volatile__(
 | |
| 		/*
 | |
| 		 * ST40-300 appears to have an issue with this code,
 | |
| 		 * normally taking two cycles each loop, as with all
 | |
| 		 * other SH variants. If however the branch and the
 | |
| 		 * delay slot straddle an 8 byte boundary, this increases
 | |
| 		 * to 3 cycles.
 | |
| 		 * This align directive ensures this doesn't occur.
 | |
| 		 */
 | |
| 		".balign 8\n\t"
 | |
| 
 | |
| 		"tst	%0, %0\n\t"
 | |
| 		"1:\t"
 | |
| 		"bf/s	1b\n\t"
 | |
| 		" dt	%0"
 | |
| 		: "=r" (loops)
 | |
| 		: "0" (loops)
 | |
| 		: "t");
 | |
| }
 | |
| 
 | |
| inline void __const_udelay(unsigned long xloops)
 | |
| {
 | |
| 	xloops *= 4;
 | |
| 	__asm__("dmulu.l	%0, %2\n\t"
 | |
| 		"sts	mach, %0"
 | |
| 		: "=r" (xloops)
 | |
| 		: "0" (xloops),
 | |
| 		  "r" (cpu_data[raw_smp_processor_id()].loops_per_jiffy * (HZ/4))
 | |
| 		: "macl", "mach");
 | |
| 	__delay(++xloops);
 | |
| }
 | |
| 
 | |
| void __udelay(unsigned long usecs)
 | |
| {
 | |
| 	__const_udelay(usecs * 0x000010c6);  /* 2**32 / 1000000 */
 | |
| }
 | |
| 
 | |
| void __ndelay(unsigned long nsecs)
 | |
| {
 | |
| 	__const_udelay(nsecs * 0x00000005);
 | |
| }
 | |
| 
 |