| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
/*
 * Cell Broadband Engine OProfile Support
 *
 * (C) Copyright IBM Corporation 2006
 *
 * Author: Maynard Johnson <maynardj@us.ibm.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifndef PR_UTIL_H
 | 
					
						
							|  |  |  | #define PR_UTIL_H
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include <linux/cpumask.h>
 | 
					
						
							|  |  |  | #include <linux/oprofile.h>
 | 
					
						
							|  |  |  | #include <asm/cell-pmu.h>
 | 
					
						
							| 
									
										
										
										
											2007-10-04 15:40:42 +10:00
										 |  |  | #include <asm/cell-regs.h>
 | 
					
						
							| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
										 |  |  | #include <asm/spu.h>
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* Defines used for sync_start */ | 
					
						
							|  |  |  | #define SKIP_GENERIC_SYNC 0
 | 
					
						
							|  |  |  | #define SYNC_START_ERROR -1
 | 
					
						
							|  |  |  | #define DO_GENERIC_SYNC 1
 | 
					
						
							| 
									
										
										
										
											2008-10-14 23:37:01 +00:00
										 |  |  | #define SPUS_PER_NODE   8
 | 
					
						
							|  |  |  | #define DEFAULT_TIMER_EXPIRE  (HZ / 10)
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | extern struct delayed_work spu_work; | 
					
						
							|  |  |  | extern int spu_prof_running; | 
					
						
							| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-12-01 16:18:36 -08:00
										 |  |  | #define TRACE_ARRAY_SIZE 1024
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | extern spinlock_t oprof_spu_smpl_arry_lck; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
										 |  |  | struct spu_overlay_info {	/* map of sections within an SPU overlay */ | 
					
						
							|  |  |  | 	unsigned int vma;	/* SPU virtual memory address from elf */ | 
					
						
							|  |  |  | 	unsigned int size;	/* size of section from elf */ | 
					
						
							|  |  |  | 	unsigned int offset;	/* offset of section into elf file */ | 
					
						
							|  |  |  | 	unsigned int buf; | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | struct vma_to_fileoffset_map {	/* map of sections within an SPU program */ | 
					
						
							|  |  |  | 	struct vma_to_fileoffset_map *next;	/* list pointer */ | 
					
						
							|  |  |  | 	unsigned int vma;	/* SPU virtual memory address from elf */ | 
					
						
							|  |  |  | 	unsigned int size;	/* size of section from elf */ | 
					
						
							|  |  |  | 	unsigned int offset;	/* offset of section into elf file */ | 
					
						
							|  |  |  | 	unsigned int guard_ptr; | 
					
						
							|  |  |  | 	unsigned int guard_val; | 
					
						
							|  |  |  |         /*
 | 
					
						
							|  |  |  | 	 * The guard pointer is an entry in the _ovly_buf_table, | 
					
						
							|  |  |  | 	 * computed using ovly.buf as the index into the table.  Since | 
					
						
							|  |  |  | 	 * ovly.buf values begin at '1' to reference the first (or 0th) | 
					
						
							|  |  |  | 	 * entry in the _ovly_buf_table, the computation subtracts 1 | 
					
						
							|  |  |  | 	 * from ovly.buf. | 
					
						
							|  |  |  | 	 * The guard value is stored in the _ovly_buf_table entry and | 
					
						
							|  |  |  | 	 * is an index (starting at 1) back to the _ovly_table entry | 
					
						
							|  |  |  | 	 * that is pointing at this _ovly_buf_table entry.  So, for | 
					
						
							|  |  |  | 	 * example, for an overlay scenario with one overlay segment | 
					
						
							|  |  |  | 	 * and two overlay sections: | 
					
						
							|  |  |  | 	 *      - Section 1 points to the first entry of the | 
					
						
							|  |  |  | 	 *        _ovly_buf_table, which contains a guard value | 
					
						
							|  |  |  | 	 *        of '1', referencing the first (index=0) entry of | 
					
						
							|  |  |  | 	 *        _ovly_table. | 
					
						
							|  |  |  | 	 *      - Section 2 points to the second entry of the | 
					
						
							|  |  |  | 	 *        _ovly_buf_table, which contains a guard value | 
					
						
							|  |  |  | 	 *        of '2', referencing the second (index=1) entry of | 
					
						
							|  |  |  | 	 *        _ovly_table. | 
					
						
							|  |  |  | 	 */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-10-14 23:37:01 +00:00
										 |  |  | struct spu_buffer { | 
					
						
							|  |  |  | 	int last_guard_val; | 
					
						
							|  |  |  | 	int ctx_sw_seen; | 
					
						
							|  |  |  | 	unsigned long *buff; | 
					
						
							|  |  |  | 	unsigned int head, tail; | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
										 |  |  | /* The three functions below are for maintaining and accessing
 | 
					
						
							|  |  |  |  * the vma-to-fileoffset map. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | struct vma_to_fileoffset_map *create_vma_map(const struct spu *spu, | 
					
						
							| 
									
										
										
										
											2009-01-06 13:58:22 +00:00
										 |  |  | 					     unsigned long objectid); | 
					
						
							| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
										 |  |  | unsigned int vma_map_lookup(struct vma_to_fileoffset_map *map, | 
					
						
							|  |  |  | 			    unsigned int vma, const struct spu *aSpu, | 
					
						
							|  |  |  | 			    int *grd_val); | 
					
						
							|  |  |  | void vma_map_free(struct vma_to_fileoffset_map *map); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /*
 | 
					
						
							|  |  |  |  * Entry point for SPU profiling. | 
					
						
							|  |  |  |  * cycles_reset is the SPU_CYCLES count value specified by the user. | 
					
						
							|  |  |  |  */ | 
					
						
							| 
									
										
										
										
											2009-01-08 15:29:47 +01:00
										 |  |  | int start_spu_profiling_cycles(unsigned int cycles_reset); | 
					
						
							| 
									
										
										
										
											2008-12-01 16:18:36 -08:00
										 |  |  | void start_spu_profiling_events(void); | 
					
						
							| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2009-01-08 15:29:47 +01:00
										 |  |  | void stop_spu_profiling_cycles(void); | 
					
						
							| 
									
										
										
										
											2008-12-01 16:18:36 -08:00
										 |  |  | void stop_spu_profiling_events(void); | 
					
						
							| 
									
										
										
										
											2007-07-20 21:39:53 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | /* add the necessary profiling hooks */ | 
					
						
							|  |  |  | int spu_sync_start(void); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* remove the hooks */ | 
					
						
							|  |  |  | int spu_sync_stop(void); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* Record SPU program counter samples to the oprofile event buffer. */ | 
					
						
							|  |  |  | void spu_sync_buffer(int spu_num, unsigned int *samples, | 
					
						
							|  |  |  | 		     int num_samples); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void set_spu_profiling_frequency(unsigned int freq_khz, unsigned int cycles_reset); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif	  /* PR_UTIL_H */
 |