 e4f30545a2
			
		
	
	
	e4f30545a2
	
	
	
		
			
			- Additional cache flushing during boot (needed in the presence of
   external caches or under virtualisation)
 - DMA range invalidation fix for non cache line aligned buffers
 - Build failure fix with !COMPAT
 - Kconfig update for STRICT_DEVMEM
 -----BEGIN PGP SIGNATURE-----
 Version: GnuPG v1.4.9 (GNU/Linux)
 
 iQIcBAABAgAGBQJTRDI8AAoJEGvWsS0AyF7xx2IP/jgBjjeIII7L6T45dG3BeJR1
 ph8CBfnsHK3wr5KXiFrdQ2mhAWFr44SLNOd9xuZZmzpA/QWlyqaH46+oqz2GozUf
 y2HucJoEIO+wXMFscQ/EQDiT4uUSbEXBQ6JeZzrhCgVaXeSs+wkKTtGXkxEh2gWo
 w4OI1/JX7phv4heim51aabzziQ3o9JziIs6hALv6OVZVsuPF/TX+mK8C2ejJWLnv
 ou+6E6iv69wNrgPnM3fcKj1CDisCNdFVvjd2LwzkJS7MUra74SWoXczCbfBYW6Ty
 1GgZ/t3TOluDoaLgXfGyQXxnhOUyHdV16034/k8wISfuXG59V0eT+CaCgAotftKD
 5oH+P4MfyVOvZpILrRtY/4MajlCr4V1RnzSYKnS/h3zzHW7Cx/BtYbbQEOVQnZwc
 Gh4adLqc0f8QtkD4zGI7UWmxPxiI9KX9EEpVDAU3TJw6FjVSp7qZ1ifajsWc201h
 STzQEu8LDBWQY2WKrtZxXvFjZj4eSSXNaDHNVCugODk2FBU6wNv4P5q1S+23xt+G
 rR9UI8a0mpginNvhnwHoIR6X+RW3CDaUzn9k3gaJWDWvGoTeuAIstdyxCn6Dm26c
 XF2B5xf5SdxXeNv513WfULCyLgJmLs9CzVFybgYWKLciLbLn7f3pAiisHuO1DWvu
 Gv+70wfYArAcbkGPw5Qt
 =mDkd
 -----END PGP SIGNATURE-----
Merge tag 'arm64-upstream' of git://git.kernel.org/pub/scm/linux/kernel/git/arm64/linux
Pull second set of arm64 updates from Catalin Marinas:
 "A second pull request for this merging window, mainly with fixes and
  docs clarification:
   - Documentation clarification on CPU topology and booting
     requirements
   - Additional cache flushing during boot (needed in the presence of
     external caches or under virtualisation)
   - DMA range invalidation fix for non cache line aligned buffers
   - Build failure fix with !COMPAT
   - Kconfig update for STRICT_DEVMEM"
* tag 'arm64-upstream' of git://git.kernel.org/pub/scm/linux/kernel/git/arm64/linux:
  arm64: Fix DMA range invalidation for cache line unaligned buffers
  arm64: Add missing Kconfig for CONFIG_STRICT_DEVMEM
  arm64: fix !CONFIG_COMPAT build failures
  Revert "arm64: virt: ensure visibility of __boot_cpu_mode"
  arm64: Relax the kernel cache requirements for boot
  arm64: Update the TCR_EL1 translation granule definitions for 16K pages
  ARM: topology: Make it clear that all CPUs need to be described
		
	
			
		
			
				
	
	
		
			600 lines
		
	
	
	
		
			16 KiB
			
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
			
		
		
	
	
			600 lines
		
	
	
	
		
			16 KiB
			
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
| /*
 | |
|  * Low-level CPU initialisation
 | |
|  * Based on arch/arm/kernel/head.S
 | |
|  *
 | |
|  * Copyright (C) 1994-2002 Russell King
 | |
|  * Copyright (C) 2003-2012 ARM Ltd.
 | |
|  * Authors:	Catalin Marinas <catalin.marinas@arm.com>
 | |
|  *		Will Deacon <will.deacon@arm.com>
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify
 | |
|  * it under the terms of the GNU General Public License version 2 as
 | |
|  * published by the Free Software Foundation.
 | |
|  *
 | |
|  * This program is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|  * GNU General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU General Public License
 | |
|  * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 | |
|  */
 | |
| 
 | |
| #include <linux/linkage.h>
 | |
| #include <linux/init.h>
 | |
| 
 | |
| #include <asm/assembler.h>
 | |
| #include <asm/ptrace.h>
 | |
| #include <asm/asm-offsets.h>
 | |
| #include <asm/cache.h>
 | |
| #include <asm/cputype.h>
 | |
| #include <asm/memory.h>
 | |
| #include <asm/thread_info.h>
 | |
| #include <asm/pgtable-hwdef.h>
 | |
| #include <asm/pgtable.h>
 | |
| #include <asm/page.h>
 | |
| #include <asm/virt.h>
 | |
| 
 | |
| /*
 | |
|  * swapper_pg_dir is the virtual address of the initial page table. We place
 | |
|  * the page tables 3 * PAGE_SIZE below KERNEL_RAM_VADDR. The idmap_pg_dir has
 | |
|  * 2 pages and is placed below swapper_pg_dir.
 | |
|  */
 | |
| #define KERNEL_RAM_VADDR	(PAGE_OFFSET + TEXT_OFFSET)
 | |
| 
 | |
| #if (KERNEL_RAM_VADDR & 0xfffff) != 0x80000
 | |
| #error KERNEL_RAM_VADDR must start at 0xXXX80000
 | |
| #endif
 | |
| 
 | |
| #define SWAPPER_DIR_SIZE	(3 * PAGE_SIZE)
 | |
| #define IDMAP_DIR_SIZE		(2 * PAGE_SIZE)
 | |
| 
 | |
| 	.globl	swapper_pg_dir
 | |
| 	.equ	swapper_pg_dir, KERNEL_RAM_VADDR - SWAPPER_DIR_SIZE
 | |
| 
 | |
| 	.globl	idmap_pg_dir
 | |
| 	.equ	idmap_pg_dir, swapper_pg_dir - IDMAP_DIR_SIZE
 | |
| 
 | |
| 	.macro	pgtbl, ttb0, ttb1, phys
 | |
| 	add	\ttb1, \phys, #TEXT_OFFSET - SWAPPER_DIR_SIZE
 | |
| 	sub	\ttb0, \ttb1, #IDMAP_DIR_SIZE
 | |
| 	.endm
 | |
| 
 | |
| #ifdef CONFIG_ARM64_64K_PAGES
 | |
| #define BLOCK_SHIFT	PAGE_SHIFT
 | |
| #define BLOCK_SIZE	PAGE_SIZE
 | |
| #else
 | |
| #define BLOCK_SHIFT	SECTION_SHIFT
 | |
| #define BLOCK_SIZE	SECTION_SIZE
 | |
| #endif
 | |
| 
 | |
| #define KERNEL_START	KERNEL_RAM_VADDR
 | |
| #define KERNEL_END	_end
 | |
| 
 | |
| /*
 | |
|  * Initial memory map attributes.
 | |
|  */
 | |
| #ifndef CONFIG_SMP
 | |
| #define PTE_FLAGS	PTE_TYPE_PAGE | PTE_AF
 | |
| #define PMD_FLAGS	PMD_TYPE_SECT | PMD_SECT_AF
 | |
| #else
 | |
| #define PTE_FLAGS	PTE_TYPE_PAGE | PTE_AF | PTE_SHARED
 | |
| #define PMD_FLAGS	PMD_TYPE_SECT | PMD_SECT_AF | PMD_SECT_S
 | |
| #endif
 | |
| 
 | |
| #ifdef CONFIG_ARM64_64K_PAGES
 | |
| #define MM_MMUFLAGS	PTE_ATTRINDX(MT_NORMAL) | PTE_FLAGS
 | |
| #else
 | |
| #define MM_MMUFLAGS	PMD_ATTRINDX(MT_NORMAL) | PMD_FLAGS
 | |
| #endif
 | |
| 
 | |
| /*
 | |
|  * Kernel startup entry point.
 | |
|  * ---------------------------
 | |
|  *
 | |
|  * The requirements are:
 | |
|  *   MMU = off, D-cache = off, I-cache = on or off,
 | |
|  *   x0 = physical address to the FDT blob.
 | |
|  *
 | |
|  * This code is mostly position independent so you call this at
 | |
|  * __pa(PAGE_OFFSET + TEXT_OFFSET).
 | |
|  *
 | |
|  * Note that the callee-saved registers are used for storing variables
 | |
|  * that are useful before the MMU is enabled. The allocations are described
 | |
|  * in the entry routines.
 | |
|  */
 | |
| 	__HEAD
 | |
| 
 | |
| 	/*
 | |
| 	 * DO NOT MODIFY. Image header expected by Linux boot-loaders.
 | |
| 	 */
 | |
| 	b	stext				// branch to kernel start, magic
 | |
| 	.long	0				// reserved
 | |
| 	.quad	TEXT_OFFSET			// Image load offset from start of RAM
 | |
| 	.quad	0				// reserved
 | |
| 	.quad	0				// reserved
 | |
| 	.quad	0				// reserved
 | |
| 	.quad	0				// reserved
 | |
| 	.quad	0				// reserved
 | |
| 	.byte	0x41				// Magic number, "ARM\x64"
 | |
| 	.byte	0x52
 | |
| 	.byte	0x4d
 | |
| 	.byte	0x64
 | |
| 	.word	0				// reserved
 | |
| 
 | |
| ENTRY(stext)
 | |
| 	mov	x21, x0				// x21=FDT
 | |
| 	bl	el2_setup			// Drop to EL1, w20=cpu_boot_mode
 | |
| 	bl	__calc_phys_offset		// x24=PHYS_OFFSET, x28=PHYS_OFFSET-PAGE_OFFSET
 | |
| 	bl	set_cpu_boot_mode_flag
 | |
| 	mrs	x22, midr_el1			// x22=cpuid
 | |
| 	mov	x0, x22
 | |
| 	bl	lookup_processor_type
 | |
| 	mov	x23, x0				// x23=current cpu_table
 | |
| 	cbz	x23, __error_p			// invalid processor (x23=0)?
 | |
| 	bl	__vet_fdt
 | |
| 	bl	__create_page_tables		// x25=TTBR0, x26=TTBR1
 | |
| 	/*
 | |
| 	 * The following calls CPU specific code in a position independent
 | |
| 	 * manner. See arch/arm64/mm/proc.S for details. x23 = base of
 | |
| 	 * cpu_info structure selected by lookup_processor_type above.
 | |
| 	 * On return, the CPU will be ready for the MMU to be turned on and
 | |
| 	 * the TCR will have been set.
 | |
| 	 */
 | |
| 	ldr	x27, __switch_data		// address to jump to after
 | |
| 						// MMU has been enabled
 | |
| 	adr	lr, __enable_mmu		// return (PIC) address
 | |
| 	ldr	x12, [x23, #CPU_INFO_SETUP]
 | |
| 	add	x12, x12, x28			// __virt_to_phys
 | |
| 	br	x12				// initialise processor
 | |
| ENDPROC(stext)
 | |
| 
 | |
| /*
 | |
|  * If we're fortunate enough to boot at EL2, ensure that the world is
 | |
|  * sane before dropping to EL1.
 | |
|  *
 | |
|  * Returns either BOOT_CPU_MODE_EL1 or BOOT_CPU_MODE_EL2 in x20 if
 | |
|  * booted in EL1 or EL2 respectively.
 | |
|  */
 | |
| ENTRY(el2_setup)
 | |
| 	mrs	x0, CurrentEL
 | |
| 	cmp	x0, #PSR_MODE_EL2t
 | |
| 	ccmp	x0, #PSR_MODE_EL2h, #0x4, ne
 | |
| 	b.ne	1f
 | |
| 	mrs	x0, sctlr_el2
 | |
| CPU_BE(	orr	x0, x0, #(1 << 25)	)	// Set the EE bit for EL2
 | |
| CPU_LE(	bic	x0, x0, #(1 << 25)	)	// Clear the EE bit for EL2
 | |
| 	msr	sctlr_el2, x0
 | |
| 	b	2f
 | |
| 1:	mrs	x0, sctlr_el1
 | |
| CPU_BE(	orr	x0, x0, #(3 << 24)	)	// Set the EE and E0E bits for EL1
 | |
| CPU_LE(	bic	x0, x0, #(3 << 24)	)	// Clear the EE and E0E bits for EL1
 | |
| 	msr	sctlr_el1, x0
 | |
| 	mov	w20, #BOOT_CPU_MODE_EL1		// This cpu booted in EL1
 | |
| 	isb
 | |
| 	ret
 | |
| 
 | |
| 	/* Hyp configuration. */
 | |
| 2:	mov	x0, #(1 << 31)			// 64-bit EL1
 | |
| 	msr	hcr_el2, x0
 | |
| 
 | |
| 	/* Generic timers. */
 | |
| 	mrs	x0, cnthctl_el2
 | |
| 	orr	x0, x0, #3			// Enable EL1 physical timers
 | |
| 	msr	cnthctl_el2, x0
 | |
| 	msr	cntvoff_el2, xzr		// Clear virtual offset
 | |
| 
 | |
| 	/* Populate ID registers. */
 | |
| 	mrs	x0, midr_el1
 | |
| 	mrs	x1, mpidr_el1
 | |
| 	msr	vpidr_el2, x0
 | |
| 	msr	vmpidr_el2, x1
 | |
| 
 | |
| 	/* sctlr_el1 */
 | |
| 	mov	x0, #0x0800			// Set/clear RES{1,0} bits
 | |
| CPU_BE(	movk	x0, #0x33d0, lsl #16	)	// Set EE and E0E on BE systems
 | |
| CPU_LE(	movk	x0, #0x30d0, lsl #16	)	// Clear EE and E0E on LE systems
 | |
| 	msr	sctlr_el1, x0
 | |
| 
 | |
| 	/* Coprocessor traps. */
 | |
| 	mov	x0, #0x33ff
 | |
| 	msr	cptr_el2, x0			// Disable copro. traps to EL2
 | |
| 
 | |
| #ifdef CONFIG_COMPAT
 | |
| 	msr	hstr_el2, xzr			// Disable CP15 traps to EL2
 | |
| #endif
 | |
| 
 | |
| 	/* Stage-2 translation */
 | |
| 	msr	vttbr_el2, xzr
 | |
| 
 | |
| 	/* Hypervisor stub */
 | |
| 	adr	x0, __hyp_stub_vectors
 | |
| 	msr	vbar_el2, x0
 | |
| 
 | |
| 	/* spsr */
 | |
| 	mov	x0, #(PSR_F_BIT | PSR_I_BIT | PSR_A_BIT | PSR_D_BIT |\
 | |
| 		      PSR_MODE_EL1h)
 | |
| 	msr	spsr_el2, x0
 | |
| 	msr	elr_el2, lr
 | |
| 	mov	w20, #BOOT_CPU_MODE_EL2		// This CPU booted in EL2
 | |
| 	eret
 | |
| ENDPROC(el2_setup)
 | |
| 
 | |
| /*
 | |
|  * Sets the __boot_cpu_mode flag depending on the CPU boot mode passed
 | |
|  * in x20. See arch/arm64/include/asm/virt.h for more info.
 | |
|  */
 | |
| ENTRY(set_cpu_boot_mode_flag)
 | |
| 	ldr	x1, =__boot_cpu_mode		// Compute __boot_cpu_mode
 | |
| 	add	x1, x1, x28
 | |
| 	cmp	w20, #BOOT_CPU_MODE_EL2
 | |
| 	b.ne	1f
 | |
| 	add	x1, x1, #4
 | |
| 1:	dc	cvac, x1			// Clean potentially dirty cache line
 | |
| 	dsb	sy
 | |
| 	str	w20, [x1]			// This CPU has booted in EL1
 | |
| 	dc	civac, x1			// Clean&invalidate potentially stale cache line
 | |
| 	dsb	sy
 | |
| 	ret
 | |
| ENDPROC(set_cpu_boot_mode_flag)
 | |
| 
 | |
| /*
 | |
|  * We need to find out the CPU boot mode long after boot, so we need to
 | |
|  * store it in a writable variable.
 | |
|  *
 | |
|  * This is not in .bss, because we set it sufficiently early that the boot-time
 | |
|  * zeroing of .bss would clobber it.
 | |
|  */
 | |
| 	.pushsection	.data..cacheline_aligned
 | |
| ENTRY(__boot_cpu_mode)
 | |
| 	.align	L1_CACHE_SHIFT
 | |
| 	.long	BOOT_CPU_MODE_EL2
 | |
| 	.long	0
 | |
| 	.popsection
 | |
| 
 | |
| 	.align	3
 | |
| 2:	.quad	.
 | |
| 	.quad	PAGE_OFFSET
 | |
| 
 | |
| #ifdef CONFIG_SMP
 | |
| 	.align	3
 | |
| 1:	.quad	.
 | |
| 	.quad	secondary_holding_pen_release
 | |
| 
 | |
| 	/*
 | |
| 	 * This provides a "holding pen" for platforms to hold all secondary
 | |
| 	 * cores are held until we're ready for them to initialise.
 | |
| 	 */
 | |
| ENTRY(secondary_holding_pen)
 | |
| 	bl	el2_setup			// Drop to EL1, w20=cpu_boot_mode
 | |
| 	bl	__calc_phys_offset		// x24=PHYS_OFFSET, x28=PHYS_OFFSET-PAGE_OFFSET
 | |
| 	bl	set_cpu_boot_mode_flag
 | |
| 	mrs	x0, mpidr_el1
 | |
| 	ldr     x1, =MPIDR_HWID_BITMASK
 | |
| 	and	x0, x0, x1
 | |
| 	adr	x1, 1b
 | |
| 	ldp	x2, x3, [x1]
 | |
| 	sub	x1, x1, x2
 | |
| 	add	x3, x3, x1
 | |
| pen:	ldr	x4, [x3]
 | |
| 	cmp	x4, x0
 | |
| 	b.eq	secondary_startup
 | |
| 	wfe
 | |
| 	b	pen
 | |
| ENDPROC(secondary_holding_pen)
 | |
| 
 | |
| 	/*
 | |
| 	 * Secondary entry point that jumps straight into the kernel. Only to
 | |
| 	 * be used where CPUs are brought online dynamically by the kernel.
 | |
| 	 */
 | |
| ENTRY(secondary_entry)
 | |
| 	bl	el2_setup			// Drop to EL1
 | |
| 	bl	__calc_phys_offset		// x24=PHYS_OFFSET, x28=PHYS_OFFSET-PAGE_OFFSET
 | |
| 	bl	set_cpu_boot_mode_flag
 | |
| 	b	secondary_startup
 | |
| ENDPROC(secondary_entry)
 | |
| 
 | |
| ENTRY(secondary_startup)
 | |
| 	/*
 | |
| 	 * Common entry point for secondary CPUs.
 | |
| 	 */
 | |
| 	mrs	x22, midr_el1			// x22=cpuid
 | |
| 	mov	x0, x22
 | |
| 	bl	lookup_processor_type
 | |
| 	mov	x23, x0				// x23=current cpu_table
 | |
| 	cbz	x23, __error_p			// invalid processor (x23=0)?
 | |
| 
 | |
| 	pgtbl	x25, x26, x24			// x25=TTBR0, x26=TTBR1
 | |
| 	ldr	x12, [x23, #CPU_INFO_SETUP]
 | |
| 	add	x12, x12, x28			// __virt_to_phys
 | |
| 	blr	x12				// initialise processor
 | |
| 
 | |
| 	ldr	x21, =secondary_data
 | |
| 	ldr	x27, =__secondary_switched	// address to jump to after enabling the MMU
 | |
| 	b	__enable_mmu
 | |
| ENDPROC(secondary_startup)
 | |
| 
 | |
| ENTRY(__secondary_switched)
 | |
| 	ldr	x0, [x21]			// get secondary_data.stack
 | |
| 	mov	sp, x0
 | |
| 	mov	x29, #0
 | |
| 	b	secondary_start_kernel
 | |
| ENDPROC(__secondary_switched)
 | |
| #endif	/* CONFIG_SMP */
 | |
| 
 | |
| /*
 | |
|  * Setup common bits before finally enabling the MMU. Essentially this is just
 | |
|  * loading the page table pointer and vector base registers.
 | |
|  *
 | |
|  * On entry to this code, x0 must contain the SCTLR_EL1 value for turning on
 | |
|  * the MMU.
 | |
|  */
 | |
| __enable_mmu:
 | |
| 	ldr	x5, =vectors
 | |
| 	msr	vbar_el1, x5
 | |
| 	msr	ttbr0_el1, x25			// load TTBR0
 | |
| 	msr	ttbr1_el1, x26			// load TTBR1
 | |
| 	isb
 | |
| 	b	__turn_mmu_on
 | |
| ENDPROC(__enable_mmu)
 | |
| 
 | |
| /*
 | |
|  * Enable the MMU. This completely changes the structure of the visible memory
 | |
|  * space. You will not be able to trace execution through this.
 | |
|  *
 | |
|  *  x0  = system control register
 | |
|  *  x27 = *virtual* address to jump to upon completion
 | |
|  *
 | |
|  * other registers depend on the function called upon completion
 | |
|  */
 | |
| 	.align	6
 | |
| __turn_mmu_on:
 | |
| 	msr	sctlr_el1, x0
 | |
| 	isb
 | |
| 	br	x27
 | |
| ENDPROC(__turn_mmu_on)
 | |
| 
 | |
| /*
 | |
|  * Calculate the start of physical memory.
 | |
|  */
 | |
| __calc_phys_offset:
 | |
| 	adr	x0, 1f
 | |
| 	ldp	x1, x2, [x0]
 | |
| 	sub	x28, x0, x1			// x28 = PHYS_OFFSET - PAGE_OFFSET
 | |
| 	add	x24, x2, x28			// x24 = PHYS_OFFSET
 | |
| 	ret
 | |
| ENDPROC(__calc_phys_offset)
 | |
| 
 | |
| 	.align 3
 | |
| 1:	.quad	.
 | |
| 	.quad	PAGE_OFFSET
 | |
| 
 | |
| /*
 | |
|  * Macro to populate the PGD for the corresponding block entry in the next
 | |
|  * level (tbl) for the given virtual address.
 | |
|  *
 | |
|  * Preserves:	pgd, tbl, virt
 | |
|  * Corrupts:	tmp1, tmp2
 | |
|  */
 | |
| 	.macro	create_pgd_entry, pgd, tbl, virt, tmp1, tmp2
 | |
| 	lsr	\tmp1, \virt, #PGDIR_SHIFT
 | |
| 	and	\tmp1, \tmp1, #PTRS_PER_PGD - 1	// PGD index
 | |
| 	orr	\tmp2, \tbl, #3			// PGD entry table type
 | |
| 	str	\tmp2, [\pgd, \tmp1, lsl #3]
 | |
| 	.endm
 | |
| 
 | |
| /*
 | |
|  * Macro to populate block entries in the page table for the start..end
 | |
|  * virtual range (inclusive).
 | |
|  *
 | |
|  * Preserves:	tbl, flags
 | |
|  * Corrupts:	phys, start, end, pstate
 | |
|  */
 | |
| 	.macro	create_block_map, tbl, flags, phys, start, end
 | |
| 	lsr	\phys, \phys, #BLOCK_SHIFT
 | |
| 	lsr	\start, \start, #BLOCK_SHIFT
 | |
| 	and	\start, \start, #PTRS_PER_PTE - 1	// table index
 | |
| 	orr	\phys, \flags, \phys, lsl #BLOCK_SHIFT	// table entry
 | |
| 	lsr	\end, \end, #BLOCK_SHIFT
 | |
| 	and	\end, \end, #PTRS_PER_PTE - 1		// table end index
 | |
| 9999:	str	\phys, [\tbl, \start, lsl #3]		// store the entry
 | |
| 	add	\start, \start, #1			// next entry
 | |
| 	add	\phys, \phys, #BLOCK_SIZE		// next block
 | |
| 	cmp	\start, \end
 | |
| 	b.ls	9999b
 | |
| 	.endm
 | |
| 
 | |
| /*
 | |
|  * Setup the initial page tables. We only setup the barest amount which is
 | |
|  * required to get the kernel running. The following sections are required:
 | |
|  *   - identity mapping to enable the MMU (low address, TTBR0)
 | |
|  *   - first few MB of the kernel linear mapping to jump to once the MMU has
 | |
|  *     been enabled, including the FDT blob (TTBR1)
 | |
|  *   - pgd entry for fixed mappings (TTBR1)
 | |
|  */
 | |
| __create_page_tables:
 | |
| 	pgtbl	x25, x26, x24			// idmap_pg_dir and swapper_pg_dir addresses
 | |
| 	mov	x27, lr
 | |
| 
 | |
| 	/*
 | |
| 	 * Invalidate the idmap and swapper page tables to avoid potential
 | |
| 	 * dirty cache lines being evicted.
 | |
| 	 */
 | |
| 	mov	x0, x25
 | |
| 	add	x1, x26, #SWAPPER_DIR_SIZE
 | |
| 	bl	__inval_cache_range
 | |
| 
 | |
| 	/*
 | |
| 	 * Clear the idmap and swapper page tables.
 | |
| 	 */
 | |
| 	mov	x0, x25
 | |
| 	add	x6, x26, #SWAPPER_DIR_SIZE
 | |
| 1:	stp	xzr, xzr, [x0], #16
 | |
| 	stp	xzr, xzr, [x0], #16
 | |
| 	stp	xzr, xzr, [x0], #16
 | |
| 	stp	xzr, xzr, [x0], #16
 | |
| 	cmp	x0, x6
 | |
| 	b.lo	1b
 | |
| 
 | |
| 	ldr	x7, =MM_MMUFLAGS
 | |
| 
 | |
| 	/*
 | |
| 	 * Create the identity mapping.
 | |
| 	 */
 | |
| 	add	x0, x25, #PAGE_SIZE		// section table address
 | |
| 	ldr	x3, =KERNEL_START
 | |
| 	add	x3, x3, x28			// __pa(KERNEL_START)
 | |
| 	create_pgd_entry x25, x0, x3, x5, x6
 | |
| 	ldr	x6, =KERNEL_END
 | |
| 	mov	x5, x3				// __pa(KERNEL_START)
 | |
| 	add	x6, x6, x28			// __pa(KERNEL_END)
 | |
| 	create_block_map x0, x7, x3, x5, x6
 | |
| 
 | |
| 	/*
 | |
| 	 * Map the kernel image (starting with PHYS_OFFSET).
 | |
| 	 */
 | |
| 	add	x0, x26, #PAGE_SIZE		// section table address
 | |
| 	mov	x5, #PAGE_OFFSET
 | |
| 	create_pgd_entry x26, x0, x5, x3, x6
 | |
| 	ldr	x6, =KERNEL_END
 | |
| 	mov	x3, x24				// phys offset
 | |
| 	create_block_map x0, x7, x3, x5, x6
 | |
| 
 | |
| 	/*
 | |
| 	 * Map the FDT blob (maximum 2MB; must be within 512MB of
 | |
| 	 * PHYS_OFFSET).
 | |
| 	 */
 | |
| 	mov	x3, x21				// FDT phys address
 | |
| 	and	x3, x3, #~((1 << 21) - 1)	// 2MB aligned
 | |
| 	mov	x6, #PAGE_OFFSET
 | |
| 	sub	x5, x3, x24			// subtract PHYS_OFFSET
 | |
| 	tst	x5, #~((1 << 29) - 1)		// within 512MB?
 | |
| 	csel	x21, xzr, x21, ne		// zero the FDT pointer
 | |
| 	b.ne	1f
 | |
| 	add	x5, x5, x6			// __va(FDT blob)
 | |
| 	add	x6, x5, #1 << 21		// 2MB for the FDT blob
 | |
| 	sub	x6, x6, #1			// inclusive range
 | |
| 	create_block_map x0, x7, x3, x5, x6
 | |
| 1:
 | |
| 	/*
 | |
| 	 * Create the pgd entry for the fixed mappings.
 | |
| 	 */
 | |
| 	ldr	x5, =FIXADDR_TOP		// Fixed mapping virtual address
 | |
| 	add	x0, x26, #2 * PAGE_SIZE		// section table address
 | |
| 	create_pgd_entry x26, x0, x5, x6, x7
 | |
| 
 | |
| 	/*
 | |
| 	 * Since the page tables have been populated with non-cacheable
 | |
| 	 * accesses (MMU disabled), invalidate the idmap and swapper page
 | |
| 	 * tables again to remove any speculatively loaded cache lines.
 | |
| 	 */
 | |
| 	mov	x0, x25
 | |
| 	add	x1, x26, #SWAPPER_DIR_SIZE
 | |
| 	bl	__inval_cache_range
 | |
| 
 | |
| 	mov	lr, x27
 | |
| 	ret
 | |
| ENDPROC(__create_page_tables)
 | |
| 	.ltorg
 | |
| 
 | |
| 	.align	3
 | |
| 	.type	__switch_data, %object
 | |
| __switch_data:
 | |
| 	.quad	__mmap_switched
 | |
| 	.quad	__bss_start			// x6
 | |
| 	.quad	_end				// x7
 | |
| 	.quad	processor_id			// x4
 | |
| 	.quad	__fdt_pointer			// x5
 | |
| 	.quad	memstart_addr			// x6
 | |
| 	.quad	init_thread_union + THREAD_START_SP // sp
 | |
| 
 | |
| /*
 | |
|  * The following fragment of code is executed with the MMU on in MMU mode, and
 | |
|  * uses absolute addresses; this is not position independent.
 | |
|  */
 | |
| __mmap_switched:
 | |
| 	adr	x3, __switch_data + 8
 | |
| 
 | |
| 	ldp	x6, x7, [x3], #16
 | |
| 1:	cmp	x6, x7
 | |
| 	b.hs	2f
 | |
| 	str	xzr, [x6], #8			// Clear BSS
 | |
| 	b	1b
 | |
| 2:
 | |
| 	ldp	x4, x5, [x3], #16
 | |
| 	ldr	x6, [x3], #8
 | |
| 	ldr	x16, [x3]
 | |
| 	mov	sp, x16
 | |
| 	str	x22, [x4]			// Save processor ID
 | |
| 	str	x21, [x5]			// Save FDT pointer
 | |
| 	str	x24, [x6]			// Save PHYS_OFFSET
 | |
| 	mov	x29, #0
 | |
| 	b	start_kernel
 | |
| ENDPROC(__mmap_switched)
 | |
| 
 | |
| /*
 | |
|  * Exception handling. Something went wrong and we can't proceed. We ought to
 | |
|  * tell the user, but since we don't have any guarantee that we're even
 | |
|  * running on the right architecture, we do virtually nothing.
 | |
|  */
 | |
| __error_p:
 | |
| ENDPROC(__error_p)
 | |
| 
 | |
| __error:
 | |
| 1:	nop
 | |
| 	b	1b
 | |
| ENDPROC(__error)
 | |
| 
 | |
| /*
 | |
|  * This function gets the processor ID in w0 and searches the cpu_table[] for
 | |
|  * a match. It returns a pointer to the struct cpu_info it found. The
 | |
|  * cpu_table[] must end with an empty (all zeros) structure.
 | |
|  *
 | |
|  * This routine can be called via C code and it needs to work with the MMU
 | |
|  * both disabled and enabled (the offset is calculated automatically).
 | |
|  */
 | |
| ENTRY(lookup_processor_type)
 | |
| 	adr	x1, __lookup_processor_type_data
 | |
| 	ldp	x2, x3, [x1]
 | |
| 	sub	x1, x1, x2			// get offset between VA and PA
 | |
| 	add	x3, x3, x1			// convert VA to PA
 | |
| 1:
 | |
| 	ldp	w5, w6, [x3]			// load cpu_id_val and cpu_id_mask
 | |
| 	cbz	w5, 2f				// end of list?
 | |
| 	and	w6, w6, w0
 | |
| 	cmp	w5, w6
 | |
| 	b.eq	3f
 | |
| 	add	x3, x3, #CPU_INFO_SZ
 | |
| 	b	1b
 | |
| 2:
 | |
| 	mov	x3, #0				// unknown processor
 | |
| 3:
 | |
| 	mov	x0, x3
 | |
| 	ret
 | |
| ENDPROC(lookup_processor_type)
 | |
| 
 | |
| 	.align	3
 | |
| 	.type	__lookup_processor_type_data, %object
 | |
| __lookup_processor_type_data:
 | |
| 	.quad	.
 | |
| 	.quad	cpu_table
 | |
| 	.size	__lookup_processor_type_data, . - __lookup_processor_type_data
 | |
| 
 | |
| /*
 | |
|  * Determine validity of the x21 FDT pointer.
 | |
|  * The dtb must be 8-byte aligned and live in the first 512M of memory.
 | |
|  */
 | |
| __vet_fdt:
 | |
| 	tst	x21, #0x7
 | |
| 	b.ne	1f
 | |
| 	cmp	x21, x24
 | |
| 	b.lt	1f
 | |
| 	mov	x0, #(1 << 29)
 | |
| 	add	x0, x0, x24
 | |
| 	cmp	x21, x0
 | |
| 	b.ge	1f
 | |
| 	ret
 | |
| 1:
 | |
| 	mov	x21, #0
 | |
| 	ret
 | |
| ENDPROC(__vet_fdt)
 |