149 lines
		
	
	
	
		
			4.2 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			149 lines
		
	
	
	
		
			4.2 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
| 
								 | 
							
								/*
							 | 
						||
| 
								 | 
							
								 * Copyright 2010 Tilera Corporation. All Rights Reserved.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 *   This program is free software; you can redistribute it and/or
							 | 
						||
| 
								 | 
							
								 *   modify it under the terms of the GNU General Public License
							 | 
						||
| 
								 | 
							
								 *   as published by the Free Software Foundation, version 2.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 *   This program is distributed in the hope that it will be useful, but
							 | 
						||
| 
								 | 
							
								 *   WITHOUT ANY WARRANTY; without even the implied warranty of
							 | 
						||
| 
								 | 
							
								 *   MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE, GOOD TITLE or
							 | 
						||
| 
								 | 
							
								 *   NON INFRINGEMENT.  See the GNU General Public License for
							 | 
						||
| 
								 | 
							
								 *   more details.
							 | 
						||
| 
								 | 
							
								 */
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#ifndef _ASM_TILE_BARRIER_H
							 | 
						||
| 
								 | 
							
								#define _ASM_TILE_BARRIER_H
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#ifndef __ASSEMBLY__
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#include <linux/types.h>
							 | 
						||
| 
								 | 
							
								#include <arch/chip.h>
							 | 
						||
| 
								 | 
							
								#include <arch/spr_def.h>
							 | 
						||
| 
								 | 
							
								#include <asm/timex.h>
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								/*
							 | 
						||
| 
								 | 
							
								 * read_barrier_depends - Flush all pending reads that subsequents reads
							 | 
						||
| 
								 | 
							
								 * depend on.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * No data-dependent reads from memory-like regions are ever reordered
							 | 
						||
| 
								 | 
							
								 * over this barrier.  All reads preceding this primitive are guaranteed
							 | 
						||
| 
								 | 
							
								 * to access memory (but not necessarily other CPUs' caches) before any
							 | 
						||
| 
								 | 
							
								 * reads following this primitive that depend on the data return by
							 | 
						||
| 
								 | 
							
								 * any of the preceding reads.  This primitive is much lighter weight than
							 | 
						||
| 
								 | 
							
								 * rmb() on most CPUs, and is never heavier weight than is
							 | 
						||
| 
								 | 
							
								 * rmb().
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * These ordering constraints are respected by both the local CPU
							 | 
						||
| 
								 | 
							
								 * and the compiler.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * Ordering is not guaranteed by anything other than these primitives,
							 | 
						||
| 
								 | 
							
								 * not even by data dependencies.  See the documentation for
							 | 
						||
| 
								 | 
							
								 * memory_barrier() for examples and URLs to more information.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * For example, the following code would force ordering (the initial
							 | 
						||
| 
								 | 
							
								 * value of "a" is zero, "b" is one, and "p" is "&a"):
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * <programlisting>
							 | 
						||
| 
								 | 
							
								 *	CPU 0				CPU 1
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 *	b = 2;
							 | 
						||
| 
								 | 
							
								 *	memory_barrier();
							 | 
						||
| 
								 | 
							
								 *	p = &b;				q = p;
							 | 
						||
| 
								 | 
							
								 *					read_barrier_depends();
							 | 
						||
| 
								 | 
							
								 *					d = *q;
							 | 
						||
| 
								 | 
							
								 * </programlisting>
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * because the read of "*q" depends on the read of "p" and these
							 | 
						||
| 
								 | 
							
								 * two reads are separated by a read_barrier_depends().  However,
							 | 
						||
| 
								 | 
							
								 * the following code, with the same initial values for "a" and "b":
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * <programlisting>
							 | 
						||
| 
								 | 
							
								 *	CPU 0				CPU 1
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 *	a = 2;
							 | 
						||
| 
								 | 
							
								 *	memory_barrier();
							 | 
						||
| 
								 | 
							
								 *	b = 3;				y = b;
							 | 
						||
| 
								 | 
							
								 *					read_barrier_depends();
							 | 
						||
| 
								 | 
							
								 *					x = a;
							 | 
						||
| 
								 | 
							
								 * </programlisting>
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * does not enforce ordering, since there is no data dependency between
							 | 
						||
| 
								 | 
							
								 * the read of "a" and the read of "b".  Therefore, on some CPUs, such
							 | 
						||
| 
								 | 
							
								 * as Alpha, "y" could be set to 3 and "x" to 0.  Use rmb()
							 | 
						||
| 
								 | 
							
								 * in cases like this where there are no data dependencies.
							 | 
						||
| 
								 | 
							
								 */
							 | 
						||
| 
								 | 
							
								#define read_barrier_depends()	do { } while (0)
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#define __sync()	__insn_mf()
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#if !CHIP_HAS_MF_WAITS_FOR_VICTIMS()
							 | 
						||
| 
								 | 
							
								#include <hv/syscall_public.h>
							 | 
						||
| 
								 | 
							
								/*
							 | 
						||
| 
								 | 
							
								 * Issue an uncacheable load to each memory controller, then
							 | 
						||
| 
								 | 
							
								 * wait until those loads have completed.
							 | 
						||
| 
								 | 
							
								 */
							 | 
						||
| 
								 | 
							
								static inline void __mb_incoherent(void)
							 | 
						||
| 
								 | 
							
								{
							 | 
						||
| 
								 | 
							
									long clobber_r10;
							 | 
						||
| 
								 | 
							
									asm volatile("swint2"
							 | 
						||
| 
								 | 
							
										     : "=R10" (clobber_r10)
							 | 
						||
| 
								 | 
							
										     : "R10" (HV_SYS_fence_incoherent)
							 | 
						||
| 
								 | 
							
										     : "r0", "r1", "r2", "r3", "r4",
							 | 
						||
| 
								 | 
							
										       "r5", "r6", "r7", "r8", "r9",
							 | 
						||
| 
								 | 
							
										       "r11", "r12", "r13", "r14",
							 | 
						||
| 
								 | 
							
										       "r15", "r16", "r17", "r18", "r19",
							 | 
						||
| 
								 | 
							
										       "r20", "r21", "r22", "r23", "r24",
							 | 
						||
| 
								 | 
							
										       "r25", "r26", "r27", "r28", "r29");
							 | 
						||
| 
								 | 
							
								}
							 | 
						||
| 
								 | 
							
								#endif
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								/* Fence to guarantee visibility of stores to incoherent memory. */
							 | 
						||
| 
								 | 
							
								static inline void
							 | 
						||
| 
								 | 
							
								mb_incoherent(void)
							 | 
						||
| 
								 | 
							
								{
							 | 
						||
| 
								 | 
							
									__insn_mf();
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#if !CHIP_HAS_MF_WAITS_FOR_VICTIMS()
							 | 
						||
| 
								 | 
							
									{
							 | 
						||
| 
								 | 
							
								#if CHIP_HAS_TILE_WRITE_PENDING()
							 | 
						||
| 
								 | 
							
										const unsigned long WRITE_TIMEOUT_CYCLES = 400;
							 | 
						||
| 
								 | 
							
										unsigned long start = get_cycles_low();
							 | 
						||
| 
								 | 
							
										do {
							 | 
						||
| 
								 | 
							
											if (__insn_mfspr(SPR_TILE_WRITE_PENDING) == 0)
							 | 
						||
| 
								 | 
							
												return;
							 | 
						||
| 
								 | 
							
										} while ((get_cycles_low() - start) < WRITE_TIMEOUT_CYCLES);
							 | 
						||
| 
								 | 
							
								#endif /* CHIP_HAS_TILE_WRITE_PENDING() */
							 | 
						||
| 
								 | 
							
										(void) __mb_incoherent();
							 | 
						||
| 
								 | 
							
									}
							 | 
						||
| 
								 | 
							
								#endif /* CHIP_HAS_MF_WAITS_FOR_VICTIMS() */
							 | 
						||
| 
								 | 
							
								}
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#define fast_wmb()	__sync()
							 | 
						||
| 
								 | 
							
								#define fast_rmb()	__sync()
							 | 
						||
| 
								 | 
							
								#define fast_mb()	__sync()
							 | 
						||
| 
								 | 
							
								#define fast_iob()	mb_incoherent()
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#define wmb()		fast_wmb()
							 | 
						||
| 
								 | 
							
								#define rmb()		fast_rmb()
							 | 
						||
| 
								 | 
							
								#define mb()		fast_mb()
							 | 
						||
| 
								 | 
							
								#define iob()		fast_iob()
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#ifdef CONFIG_SMP
							 | 
						||
| 
								 | 
							
								#define smp_mb()	mb()
							 | 
						||
| 
								 | 
							
								#define smp_rmb()	rmb()
							 | 
						||
| 
								 | 
							
								#define smp_wmb()	wmb()
							 | 
						||
| 
								 | 
							
								#define smp_read_barrier_depends()	read_barrier_depends()
							 | 
						||
| 
								 | 
							
								#else
							 | 
						||
| 
								 | 
							
								#define smp_mb()	barrier()
							 | 
						||
| 
								 | 
							
								#define smp_rmb()	barrier()
							 | 
						||
| 
								 | 
							
								#define smp_wmb()	barrier()
							 | 
						||
| 
								 | 
							
								#define smp_read_barrier_depends()	do { } while (0)
							 | 
						||
| 
								 | 
							
								#endif
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#define set_mb(var, value) \
							 | 
						||
| 
								 | 
							
									do { var = value; mb(); } while (0)
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#endif /* !__ASSEMBLY__ */
							 | 
						||
| 
								 | 
							
								#endif /* _ASM_TILE_BARRIER_H */
							 |