2012-03-05 19:49:27 +08:00
|
|
|
/*
|
|
|
|
* Low-level CPU initialisation
|
|
|
|
* Based on arch/arm/kernel/head.S
|
|
|
|
*
|
|
|
|
* Copyright (C) 1994-2002 Russell King
|
|
|
|
* Copyright (C) 2003-2012 ARM Ltd.
|
|
|
|
* Authors: Catalin Marinas <catalin.marinas@arm.com>
|
|
|
|
* Will Deacon <will.deacon@arm.com>
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License version 2 as
|
|
|
|
* published by the Free Software Foundation.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/linkage.h>
|
|
|
|
#include <linux/init.h>
|
|
|
|
|
|
|
|
#include <asm/assembler.h>
|
|
|
|
#include <asm/ptrace.h>
|
|
|
|
#include <asm/asm-offsets.h>
|
2014-03-27 02:25:55 +08:00
|
|
|
#include <asm/cache.h>
|
2012-08-30 01:32:18 +08:00
|
|
|
#include <asm/cputype.h>
|
2012-03-05 19:49:27 +08:00
|
|
|
#include <asm/memory.h>
|
|
|
|
#include <asm/thread_info.h>
|
|
|
|
#include <asm/pgtable-hwdef.h>
|
|
|
|
#include <asm/pgtable.h>
|
|
|
|
#include <asm/page.h>
|
2012-10-26 22:40:05 +08:00
|
|
|
#include <asm/virt.h>
|
2012-03-05 19:49:27 +08:00
|
|
|
|
|
|
|
#define KERNEL_RAM_VADDR (PAGE_OFFSET + TEXT_OFFSET)
|
|
|
|
|
2014-06-24 23:51:37 +08:00
|
|
|
#if (TEXT_OFFSET & 0xf) != 0
|
|
|
|
#error TEXT_OFFSET must be at least 16B aligned
|
|
|
|
#elif (PAGE_OFFSET & 0xfffff) != 0
|
|
|
|
#error PAGE_OFFSET must be at least 2MB aligned
|
|
|
|
#elif TEXT_OFFSET > 0xfffff
|
|
|
|
#error TEXT_OFFSET must be less than 2MB
|
2012-03-05 19:49:27 +08:00
|
|
|
#endif
|
|
|
|
|
2014-06-24 23:51:35 +08:00
|
|
|
.macro pgtbl, ttb0, ttb1, virt_to_phys
|
|
|
|
ldr \ttb1, =swapper_pg_dir
|
|
|
|
ldr \ttb0, =idmap_pg_dir
|
|
|
|
add \ttb1, \ttb1, \virt_to_phys
|
|
|
|
add \ttb0, \ttb0, \virt_to_phys
|
2012-03-05 19:49:27 +08:00
|
|
|
.endm
|
|
|
|
|
|
|
|
#ifdef CONFIG_ARM64_64K_PAGES
|
|
|
|
#define BLOCK_SHIFT PAGE_SHIFT
|
|
|
|
#define BLOCK_SIZE PAGE_SIZE
|
|
|
|
#else
|
|
|
|
#define BLOCK_SHIFT SECTION_SHIFT
|
|
|
|
#define BLOCK_SIZE SECTION_SIZE
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#define KERNEL_START KERNEL_RAM_VADDR
|
|
|
|
#define KERNEL_END _end
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Initial memory map attributes.
|
|
|
|
*/
|
|
|
|
#ifndef CONFIG_SMP
|
|
|
|
#define PTE_FLAGS PTE_TYPE_PAGE | PTE_AF
|
|
|
|
#define PMD_FLAGS PMD_TYPE_SECT | PMD_SECT_AF
|
|
|
|
#else
|
|
|
|
#define PTE_FLAGS PTE_TYPE_PAGE | PTE_AF | PTE_SHARED
|
|
|
|
#define PMD_FLAGS PMD_TYPE_SECT | PMD_SECT_AF | PMD_SECT_S
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef CONFIG_ARM64_64K_PAGES
|
|
|
|
#define MM_MMUFLAGS PTE_ATTRINDX(MT_NORMAL) | PTE_FLAGS
|
|
|
|
#else
|
|
|
|
#define MM_MMUFLAGS PMD_ATTRINDX(MT_NORMAL) | PMD_FLAGS
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Kernel startup entry point.
|
|
|
|
* ---------------------------
|
|
|
|
*
|
|
|
|
* The requirements are:
|
|
|
|
* MMU = off, D-cache = off, I-cache = on or off,
|
|
|
|
* x0 = physical address to the FDT blob.
|
|
|
|
*
|
|
|
|
* This code is mostly position independent so you call this at
|
|
|
|
* __pa(PAGE_OFFSET + TEXT_OFFSET).
|
|
|
|
*
|
|
|
|
* Note that the callee-saved registers are used for storing variables
|
|
|
|
* that are useful before the MMU is enabled. The allocations are described
|
|
|
|
* in the entry routines.
|
|
|
|
*/
|
|
|
|
__HEAD
|
|
|
|
|
|
|
|
/*
|
|
|
|
* DO NOT MODIFY. Image header expected by Linux boot-loaders.
|
|
|
|
*/
|
2014-04-16 10:47:52 +08:00
|
|
|
#ifdef CONFIG_EFI
|
|
|
|
efi_head:
|
|
|
|
/*
|
|
|
|
* This add instruction has no meaningful effect except that
|
|
|
|
* its opcode forms the magic "MZ" signature required by UEFI.
|
|
|
|
*/
|
|
|
|
add x13, x18, #0x16
|
|
|
|
b stext
|
|
|
|
#else
|
2012-03-05 19:49:27 +08:00
|
|
|
b stext // branch to kernel start, magic
|
|
|
|
.long 0 // reserved
|
2014-04-16 10:47:52 +08:00
|
|
|
#endif
|
arm64: Update the Image header
Currently the kernel Image is stripped of everything past the initial
stack, and at runtime the memory is initialised and used by the kernel.
This makes the effective minimum memory footprint of the kernel larger
than the size of the loaded binary, though bootloaders have no mechanism
to identify how large this minimum memory footprint is. This makes it
difficult to choose safe locations to place both the kernel and other
binaries required at boot (DTB, initrd, etc), such that the kernel won't
clobber said binaries or other reserved memory during initialisation.
Additionally when big endian support was added the image load offset was
overlooked, and is currently of an arbitrary endianness, which makes it
difficult for bootloaders to make use of it. It seems that bootloaders
aren't respecting the image load offset at present anyway, and are
assuming that offset 0x80000 will always be correct.
This patch adds an effective image size to the kernel header which
describes the amount of memory from the start of the kernel Image binary
which the kernel expects to use before detecting memory and handling any
memory reservations. This can be used by bootloaders to choose suitable
locations to load the kernel and/or other binaries such that the kernel
will not clobber any memory unexpectedly. As before, memory reservations
are required to prevent the kernel from clobbering these locations
later.
Both the image load offset and the effective image size are forced to be
little-endian regardless of the native endianness of the kernel to
enable bootloaders to load a kernel of arbitrary endianness. Bootloaders
which wish to make use of the load offset can inspect the effective
image size field for a non-zero value to determine if the offset is of a
known endianness. To enable software to determine the endinanness of the
kernel as may be required for certain use-cases, a new flags field (also
little-endian) is added to the kernel header to export this information.
The documentation is updated to clarify these details. To discourage
future assumptions regarding the value of text_offset, the value at this
point in time is removed from the main flow of the documentation (though
kept as a compatibility note). Some minor formatting issues in the
documentation are also corrected.
Signed-off-by: Mark Rutland <mark.rutland@arm.com>
Acked-by: Tom Rini <trini@ti.com>
Cc: Geoff Levand <geoff@infradead.org>
Cc: Kevin Hilman <kevin.hilman@linaro.org>
Acked-by: Will Deacon <will.deacon@arm.com>
Signed-off-by: Catalin Marinas <catalin.marinas@arm.com>
2014-06-24 23:51:36 +08:00
|
|
|
.quad _kernel_offset_le // Image load offset from start of RAM, little-endian
|
|
|
|
.quad _kernel_size_le // Effective size of kernel image, little-endian
|
|
|
|
.quad _kernel_flags_le // Informative flags, little-endian
|
2013-08-15 07:10:00 +08:00
|
|
|
.quad 0 // reserved
|
|
|
|
.quad 0 // reserved
|
|
|
|
.quad 0 // reserved
|
|
|
|
.byte 0x41 // Magic number, "ARM\x64"
|
|
|
|
.byte 0x52
|
|
|
|
.byte 0x4d
|
|
|
|
.byte 0x64
|
2014-04-16 10:47:52 +08:00
|
|
|
#ifdef CONFIG_EFI
|
|
|
|
.long pe_header - efi_head // Offset to the PE header.
|
|
|
|
#else
|
2013-08-15 07:10:00 +08:00
|
|
|
.word 0 // reserved
|
2014-04-16 10:47:52 +08:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef CONFIG_EFI
|
|
|
|
.align 3
|
|
|
|
pe_header:
|
|
|
|
.ascii "PE"
|
|
|
|
.short 0
|
|
|
|
coff_header:
|
|
|
|
.short 0xaa64 // AArch64
|
|
|
|
.short 2 // nr_sections
|
|
|
|
.long 0 // TimeDateStamp
|
|
|
|
.long 0 // PointerToSymbolTable
|
|
|
|
.long 1 // NumberOfSymbols
|
|
|
|
.short section_table - optional_header // SizeOfOptionalHeader
|
|
|
|
.short 0x206 // Characteristics.
|
|
|
|
// IMAGE_FILE_DEBUG_STRIPPED |
|
|
|
|
// IMAGE_FILE_EXECUTABLE_IMAGE |
|
|
|
|
// IMAGE_FILE_LINE_NUMS_STRIPPED
|
|
|
|
optional_header:
|
|
|
|
.short 0x20b // PE32+ format
|
|
|
|
.byte 0x02 // MajorLinkerVersion
|
|
|
|
.byte 0x14 // MinorLinkerVersion
|
|
|
|
.long _edata - stext // SizeOfCode
|
|
|
|
.long 0 // SizeOfInitializedData
|
|
|
|
.long 0 // SizeOfUninitializedData
|
|
|
|
.long efi_stub_entry - efi_head // AddressOfEntryPoint
|
|
|
|
.long stext - efi_head // BaseOfCode
|
|
|
|
|
|
|
|
extra_header_fields:
|
|
|
|
.quad 0 // ImageBase
|
|
|
|
.long 0x20 // SectionAlignment
|
|
|
|
.long 0x8 // FileAlignment
|
|
|
|
.short 0 // MajorOperatingSystemVersion
|
|
|
|
.short 0 // MinorOperatingSystemVersion
|
|
|
|
.short 0 // MajorImageVersion
|
|
|
|
.short 0 // MinorImageVersion
|
|
|
|
.short 0 // MajorSubsystemVersion
|
|
|
|
.short 0 // MinorSubsystemVersion
|
|
|
|
.long 0 // Win32VersionValue
|
|
|
|
|
|
|
|
.long _edata - efi_head // SizeOfImage
|
|
|
|
|
|
|
|
// Everything before the kernel image is considered part of the header
|
|
|
|
.long stext - efi_head // SizeOfHeaders
|
|
|
|
.long 0 // CheckSum
|
|
|
|
.short 0xa // Subsystem (EFI application)
|
|
|
|
.short 0 // DllCharacteristics
|
|
|
|
.quad 0 // SizeOfStackReserve
|
|
|
|
.quad 0 // SizeOfStackCommit
|
|
|
|
.quad 0 // SizeOfHeapReserve
|
|
|
|
.quad 0 // SizeOfHeapCommit
|
|
|
|
.long 0 // LoaderFlags
|
|
|
|
.long 0x6 // NumberOfRvaAndSizes
|
|
|
|
|
|
|
|
.quad 0 // ExportTable
|
|
|
|
.quad 0 // ImportTable
|
|
|
|
.quad 0 // ResourceTable
|
|
|
|
.quad 0 // ExceptionTable
|
|
|
|
.quad 0 // CertificationTable
|
|
|
|
.quad 0 // BaseRelocationTable
|
|
|
|
|
|
|
|
// Section table
|
|
|
|
section_table:
|
|
|
|
|
|
|
|
/*
|
|
|
|
* The EFI application loader requires a relocation section
|
|
|
|
* because EFI applications must be relocatable. This is a
|
|
|
|
* dummy section as far as we are concerned.
|
|
|
|
*/
|
|
|
|
.ascii ".reloc"
|
|
|
|
.byte 0
|
|
|
|
.byte 0 // end of 0 padding of section name
|
|
|
|
.long 0
|
|
|
|
.long 0
|
|
|
|
.long 0 // SizeOfRawData
|
|
|
|
.long 0 // PointerToRawData
|
|
|
|
.long 0 // PointerToRelocations
|
|
|
|
.long 0 // PointerToLineNumbers
|
|
|
|
.short 0 // NumberOfRelocations
|
|
|
|
.short 0 // NumberOfLineNumbers
|
|
|
|
.long 0x42100040 // Characteristics (section flags)
|
|
|
|
|
|
|
|
|
|
|
|
.ascii ".text"
|
|
|
|
.byte 0
|
|
|
|
.byte 0
|
|
|
|
.byte 0 // end of 0 padding of section name
|
|
|
|
.long _edata - stext // VirtualSize
|
|
|
|
.long stext - efi_head // VirtualAddress
|
|
|
|
.long _edata - stext // SizeOfRawData
|
|
|
|
.long stext - efi_head // PointerToRawData
|
|
|
|
|
|
|
|
.long 0 // PointerToRelocations (0 for executables)
|
|
|
|
.long 0 // PointerToLineNumbers (0 for executables)
|
|
|
|
.short 0 // NumberOfRelocations (0 for executables)
|
|
|
|
.short 0 // NumberOfLineNumbers (0 for executables)
|
|
|
|
.long 0xe0500020 // Characteristics (section flags)
|
|
|
|
.align 5
|
|
|
|
#endif
|
2012-03-05 19:49:27 +08:00
|
|
|
|
|
|
|
ENTRY(stext)
|
|
|
|
mov x21, x0 // x21=FDT
|
2013-10-11 21:52:16 +08:00
|
|
|
bl el2_setup // Drop to EL1, w20=cpu_boot_mode
|
2012-10-26 22:40:05 +08:00
|
|
|
bl __calc_phys_offset // x24=PHYS_OFFSET, x28=PHYS_OFFSET-PAGE_OFFSET
|
2013-10-11 21:52:16 +08:00
|
|
|
bl set_cpu_boot_mode_flag
|
2012-03-05 19:49:27 +08:00
|
|
|
mrs x22, midr_el1 // x22=cpuid
|
|
|
|
mov x0, x22
|
|
|
|
bl lookup_processor_type
|
|
|
|
mov x23, x0 // x23=current cpu_table
|
|
|
|
cbz x23, __error_p // invalid processor (x23=0)?
|
|
|
|
bl __vet_fdt
|
|
|
|
bl __create_page_tables // x25=TTBR0, x26=TTBR1
|
|
|
|
/*
|
|
|
|
* The following calls CPU specific code in a position independent
|
|
|
|
* manner. See arch/arm64/mm/proc.S for details. x23 = base of
|
|
|
|
* cpu_info structure selected by lookup_processor_type above.
|
|
|
|
* On return, the CPU will be ready for the MMU to be turned on and
|
|
|
|
* the TCR will have been set.
|
|
|
|
*/
|
|
|
|
ldr x27, __switch_data // address to jump to after
|
|
|
|
// MMU has been enabled
|
|
|
|
adr lr, __enable_mmu // return (PIC) address
|
|
|
|
ldr x12, [x23, #CPU_INFO_SETUP]
|
|
|
|
add x12, x12, x28 // __virt_to_phys
|
|
|
|
br x12 // initialise processor
|
|
|
|
ENDPROC(stext)
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If we're fortunate enough to boot at EL2, ensure that the world is
|
|
|
|
* sane before dropping to EL1.
|
2013-10-11 21:52:16 +08:00
|
|
|
*
|
|
|
|
* Returns either BOOT_CPU_MODE_EL1 or BOOT_CPU_MODE_EL2 in x20 if
|
|
|
|
* booted in EL1 or EL2 respectively.
|
2012-03-05 19:49:27 +08:00
|
|
|
*/
|
|
|
|
ENTRY(el2_setup)
|
|
|
|
mrs x0, CurrentEL
|
2014-06-06 21:16:21 +08:00
|
|
|
cmp x0, #CurrentEL_EL2
|
2013-10-11 21:52:17 +08:00
|
|
|
b.ne 1f
|
|
|
|
mrs x0, sctlr_el2
|
|
|
|
CPU_BE( orr x0, x0, #(1 << 25) ) // Set the EE bit for EL2
|
|
|
|
CPU_LE( bic x0, x0, #(1 << 25) ) // Clear the EE bit for EL2
|
|
|
|
msr sctlr_el2, x0
|
|
|
|
b 2f
|
|
|
|
1: mrs x0, sctlr_el1
|
|
|
|
CPU_BE( orr x0, x0, #(3 << 24) ) // Set the EE and E0E bits for EL1
|
|
|
|
CPU_LE( bic x0, x0, #(3 << 24) ) // Clear the EE and E0E bits for EL1
|
|
|
|
msr sctlr_el1, x0
|
2013-10-11 21:52:16 +08:00
|
|
|
mov w20, #BOOT_CPU_MODE_EL1 // This cpu booted in EL1
|
2013-10-11 21:52:17 +08:00
|
|
|
isb
|
2012-03-05 19:49:27 +08:00
|
|
|
ret
|
|
|
|
|
|
|
|
/* Hyp configuration. */
|
2013-10-11 21:52:17 +08:00
|
|
|
2: mov x0, #(1 << 31) // 64-bit EL1
|
2012-03-05 19:49:27 +08:00
|
|
|
msr hcr_el2, x0
|
|
|
|
|
|
|
|
/* Generic timers. */
|
|
|
|
mrs x0, cnthctl_el2
|
|
|
|
orr x0, x0, #3 // Enable EL1 physical timers
|
|
|
|
msr cnthctl_el2, x0
|
2012-11-30 06:48:31 +08:00
|
|
|
msr cntvoff_el2, xzr // Clear virtual offset
|
2012-03-05 19:49:27 +08:00
|
|
|
|
|
|
|
/* Populate ID registers. */
|
|
|
|
mrs x0, midr_el1
|
|
|
|
mrs x1, mpidr_el1
|
|
|
|
msr vpidr_el2, x0
|
|
|
|
msr vmpidr_el2, x1
|
|
|
|
|
|
|
|
/* sctlr_el1 */
|
|
|
|
mov x0, #0x0800 // Set/clear RES{1,0} bits
|
2013-10-11 21:52:17 +08:00
|
|
|
CPU_BE( movk x0, #0x33d0, lsl #16 ) // Set EE and E0E on BE systems
|
|
|
|
CPU_LE( movk x0, #0x30d0, lsl #16 ) // Clear EE and E0E on LE systems
|
2012-03-05 19:49:27 +08:00
|
|
|
msr sctlr_el1, x0
|
|
|
|
|
|
|
|
/* Coprocessor traps. */
|
|
|
|
mov x0, #0x33ff
|
|
|
|
msr cptr_el2, x0 // Disable copro. traps to EL2
|
|
|
|
|
|
|
|
#ifdef CONFIG_COMPAT
|
|
|
|
msr hstr_el2, xzr // Disable CP15 traps to EL2
|
|
|
|
#endif
|
|
|
|
|
2012-11-07 03:27:59 +08:00
|
|
|
/* Stage-2 translation */
|
|
|
|
msr vttbr_el2, xzr
|
|
|
|
|
2012-10-20 00:46:27 +08:00
|
|
|
/* Hypervisor stub */
|
|
|
|
adr x0, __hyp_stub_vectors
|
|
|
|
msr vbar_el2, x0
|
|
|
|
|
2012-03-05 19:49:27 +08:00
|
|
|
/* spsr */
|
|
|
|
mov x0, #(PSR_F_BIT | PSR_I_BIT | PSR_A_BIT | PSR_D_BIT |\
|
|
|
|
PSR_MODE_EL1h)
|
|
|
|
msr spsr_el2, x0
|
|
|
|
msr elr_el2, lr
|
2013-10-11 21:52:16 +08:00
|
|
|
mov w20, #BOOT_CPU_MODE_EL2 // This CPU booted in EL2
|
2012-03-05 19:49:27 +08:00
|
|
|
eret
|
|
|
|
ENDPROC(el2_setup)
|
|
|
|
|
2013-10-11 21:52:16 +08:00
|
|
|
/*
|
|
|
|
* Sets the __boot_cpu_mode flag depending on the CPU boot mode passed
|
|
|
|
* in x20. See arch/arm64/include/asm/virt.h for more info.
|
|
|
|
*/
|
|
|
|
ENTRY(set_cpu_boot_mode_flag)
|
|
|
|
ldr x1, =__boot_cpu_mode // Compute __boot_cpu_mode
|
|
|
|
add x1, x1, x28
|
|
|
|
cmp w20, #BOOT_CPU_MODE_EL2
|
|
|
|
b.ne 1f
|
|
|
|
add x1, x1, #4
|
2014-05-02 23:24:13 +08:00
|
|
|
1: str w20, [x1] // This CPU has booted in EL1
|
|
|
|
dmb sy
|
|
|
|
dc ivac, x1 // Invalidate potentially stale cache line
|
2013-10-11 21:52:16 +08:00
|
|
|
ret
|
|
|
|
ENDPROC(set_cpu_boot_mode_flag)
|
|
|
|
|
2012-10-26 22:40:05 +08:00
|
|
|
/*
|
|
|
|
* We need to find out the CPU boot mode long after boot, so we need to
|
|
|
|
* store it in a writable variable.
|
|
|
|
*
|
|
|
|
* This is not in .bss, because we set it sufficiently early that the boot-time
|
|
|
|
* zeroing of .bss would clobber it.
|
|
|
|
*/
|
2014-03-27 02:25:55 +08:00
|
|
|
.pushsection .data..cacheline_aligned
|
2012-10-26 22:40:05 +08:00
|
|
|
ENTRY(__boot_cpu_mode)
|
2014-03-27 02:25:55 +08:00
|
|
|
.align L1_CACHE_SHIFT
|
2012-10-26 22:40:05 +08:00
|
|
|
.long BOOT_CPU_MODE_EL2
|
|
|
|
.long 0
|
|
|
|
.popsection
|
|
|
|
|
2012-03-05 19:49:27 +08:00
|
|
|
.align 3
|
|
|
|
2: .quad .
|
|
|
|
.quad PAGE_OFFSET
|
|
|
|
|
|
|
|
#ifdef CONFIG_SMP
|
|
|
|
.align 3
|
|
|
|
1: .quad .
|
|
|
|
.quad secondary_holding_pen_release
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This provides a "holding pen" for platforms to hold all secondary
|
|
|
|
* cores are held until we're ready for them to initialise.
|
|
|
|
*/
|
|
|
|
ENTRY(secondary_holding_pen)
|
2013-10-11 21:52:16 +08:00
|
|
|
bl el2_setup // Drop to EL1, w20=cpu_boot_mode
|
|
|
|
bl __calc_phys_offset // x24=PHYS_OFFSET, x28=PHYS_OFFSET-PAGE_OFFSET
|
|
|
|
bl set_cpu_boot_mode_flag
|
2012-03-05 19:49:27 +08:00
|
|
|
mrs x0, mpidr_el1
|
2012-08-30 01:32:18 +08:00
|
|
|
ldr x1, =MPIDR_HWID_BITMASK
|
|
|
|
and x0, x0, x1
|
2012-03-05 19:49:27 +08:00
|
|
|
adr x1, 1b
|
|
|
|
ldp x2, x3, [x1]
|
|
|
|
sub x1, x1, x2
|
|
|
|
add x3, x3, x1
|
|
|
|
pen: ldr x4, [x3]
|
|
|
|
cmp x4, x0
|
|
|
|
b.eq secondary_startup
|
|
|
|
wfe
|
|
|
|
b pen
|
|
|
|
ENDPROC(secondary_holding_pen)
|
arm64: factor out spin-table boot method
The arm64 kernel has an internal holding pen, which is necessary for
some systems where we can't bring CPUs online individually and must hold
multiple CPUs in a safe area until the kernel is able to handle them.
The current SMP infrastructure for arm64 is closely coupled to this
holding pen, and alternative boot methods must launch CPUs into the pen,
where they sit before they are launched into the kernel proper.
With PSCI (and possibly other future boot methods), we can bring CPUs
online individually, and need not perform the secondary_holding_pen
dance. Instead, this patch factors the holding pen management code out
to the spin-table boot method code, as it is the only boot method
requiring the pen.
A new entry point for secondaries, secondary_entry is added for other
boot methods to use, which bypasses the holding pen and its associated
overhead when bringing CPUs online. The smp.pen.text section is also
removed, as the pen can live in head.text without problem.
The cpu_operations structure is extended with two new functions,
cpu_boot and cpu_postboot, for bringing a cpu into the kernel and
performing any post-boot cleanup required by a bootmethod (e.g.
resetting the secondary_holding_pen_release to INVALID_HWID).
Documentation is added for cpu_operations.
Signed-off-by: Mark Rutland <mark.rutland@arm.com>
Signed-off-by: Catalin Marinas <catalin.marinas@arm.com>
2013-10-25 03:30:16 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Secondary entry point that jumps straight into the kernel. Only to
|
|
|
|
* be used where CPUs are brought online dynamically by the kernel.
|
|
|
|
*/
|
|
|
|
ENTRY(secondary_entry)
|
|
|
|
bl el2_setup // Drop to EL1
|
2013-11-19 02:56:42 +08:00
|
|
|
bl __calc_phys_offset // x24=PHYS_OFFSET, x28=PHYS_OFFSET-PAGE_OFFSET
|
|
|
|
bl set_cpu_boot_mode_flag
|
arm64: factor out spin-table boot method
The arm64 kernel has an internal holding pen, which is necessary for
some systems where we can't bring CPUs online individually and must hold
multiple CPUs in a safe area until the kernel is able to handle them.
The current SMP infrastructure for arm64 is closely coupled to this
holding pen, and alternative boot methods must launch CPUs into the pen,
where they sit before they are launched into the kernel proper.
With PSCI (and possibly other future boot methods), we can bring CPUs
online individually, and need not perform the secondary_holding_pen
dance. Instead, this patch factors the holding pen management code out
to the spin-table boot method code, as it is the only boot method
requiring the pen.
A new entry point for secondaries, secondary_entry is added for other
boot methods to use, which bypasses the holding pen and its associated
overhead when bringing CPUs online. The smp.pen.text section is also
removed, as the pen can live in head.text without problem.
The cpu_operations structure is extended with two new functions,
cpu_boot and cpu_postboot, for bringing a cpu into the kernel and
performing any post-boot cleanup required by a bootmethod (e.g.
resetting the secondary_holding_pen_release to INVALID_HWID).
Documentation is added for cpu_operations.
Signed-off-by: Mark Rutland <mark.rutland@arm.com>
Signed-off-by: Catalin Marinas <catalin.marinas@arm.com>
2013-10-25 03:30:16 +08:00
|
|
|
b secondary_startup
|
|
|
|
ENDPROC(secondary_entry)
|
2012-03-05 19:49:27 +08:00
|
|
|
|
|
|
|
ENTRY(secondary_startup)
|
|
|
|
/*
|
|
|
|
* Common entry point for secondary CPUs.
|
|
|
|
*/
|
|
|
|
mrs x22, midr_el1 // x22=cpuid
|
|
|
|
mov x0, x22
|
|
|
|
bl lookup_processor_type
|
|
|
|
mov x23, x0 // x23=current cpu_table
|
|
|
|
cbz x23, __error_p // invalid processor (x23=0)?
|
|
|
|
|
2014-06-24 23:51:35 +08:00
|
|
|
pgtbl x25, x26, x28 // x25=TTBR0, x26=TTBR1
|
2012-03-05 19:49:27 +08:00
|
|
|
ldr x12, [x23, #CPU_INFO_SETUP]
|
|
|
|
add x12, x12, x28 // __virt_to_phys
|
|
|
|
blr x12 // initialise processor
|
|
|
|
|
|
|
|
ldr x21, =secondary_data
|
|
|
|
ldr x27, =__secondary_switched // address to jump to after enabling the MMU
|
|
|
|
b __enable_mmu
|
|
|
|
ENDPROC(secondary_startup)
|
|
|
|
|
|
|
|
ENTRY(__secondary_switched)
|
|
|
|
ldr x0, [x21] // get secondary_data.stack
|
|
|
|
mov sp, x0
|
|
|
|
mov x29, #0
|
|
|
|
b secondary_start_kernel
|
|
|
|
ENDPROC(__secondary_switched)
|
|
|
|
#endif /* CONFIG_SMP */
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Setup common bits before finally enabling the MMU. Essentially this is just
|
|
|
|
* loading the page table pointer and vector base registers.
|
|
|
|
*
|
|
|
|
* On entry to this code, x0 must contain the SCTLR_EL1 value for turning on
|
|
|
|
* the MMU.
|
|
|
|
*/
|
|
|
|
__enable_mmu:
|
|
|
|
ldr x5, =vectors
|
|
|
|
msr vbar_el1, x5
|
|
|
|
msr ttbr0_el1, x25 // load TTBR0
|
|
|
|
msr ttbr1_el1, x26 // load TTBR1
|
|
|
|
isb
|
|
|
|
b __turn_mmu_on
|
|
|
|
ENDPROC(__enable_mmu)
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Enable the MMU. This completely changes the structure of the visible memory
|
|
|
|
* space. You will not be able to trace execution through this.
|
|
|
|
*
|
|
|
|
* x0 = system control register
|
|
|
|
* x27 = *virtual* address to jump to upon completion
|
|
|
|
*
|
|
|
|
* other registers depend on the function called upon completion
|
2014-06-24 23:51:34 +08:00
|
|
|
*
|
|
|
|
* We align the entire function to the smallest power of two larger than it to
|
|
|
|
* ensure it fits within a single block map entry. Otherwise were PHYS_OFFSET
|
|
|
|
* close to the end of a 512MB or 1GB block we might require an additional
|
|
|
|
* table to map the entire function.
|
2012-03-05 19:49:27 +08:00
|
|
|
*/
|
2014-06-24 23:51:34 +08:00
|
|
|
.align 4
|
2012-03-05 19:49:27 +08:00
|
|
|
__turn_mmu_on:
|
|
|
|
msr sctlr_el1, x0
|
|
|
|
isb
|
|
|
|
br x27
|
|
|
|
ENDPROC(__turn_mmu_on)
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Calculate the start of physical memory.
|
|
|
|
*/
|
|
|
|
__calc_phys_offset:
|
|
|
|
adr x0, 1f
|
|
|
|
ldp x1, x2, [x0]
|
|
|
|
sub x28, x0, x1 // x28 = PHYS_OFFSET - PAGE_OFFSET
|
|
|
|
add x24, x2, x28 // x24 = PHYS_OFFSET
|
|
|
|
ret
|
|
|
|
ENDPROC(__calc_phys_offset)
|
|
|
|
|
|
|
|
.align 3
|
|
|
|
1: .quad .
|
|
|
|
.quad PAGE_OFFSET
|
|
|
|
|
|
|
|
/*
|
2014-05-12 17:40:51 +08:00
|
|
|
* Macro to populate the PUD for the corresponding block entry in the next
|
|
|
|
* level (tbl) for the given virtual address in case of 4 levels.
|
2012-03-05 19:49:27 +08:00
|
|
|
*
|
2014-05-12 17:40:51 +08:00
|
|
|
* Preserves: pgd, virt
|
|
|
|
* Corrupts: tbl, tmp1, tmp2
|
|
|
|
* Returns: pud
|
2012-03-05 19:49:27 +08:00
|
|
|
*/
|
2014-05-12 17:40:51 +08:00
|
|
|
.macro create_pud_entry, pgd, tbl, virt, pud, tmp1, tmp2
|
|
|
|
#ifdef CONFIG_ARM64_4_LEVELS
|
|
|
|
add \tbl, \tbl, #PAGE_SIZE // bump tbl 1 page up.
|
|
|
|
// to make room for pud
|
|
|
|
add \pud, \pgd, #PAGE_SIZE // pgd points to pud which
|
|
|
|
// follows pgd
|
|
|
|
lsr \tmp1, \virt, #PUD_SHIFT
|
|
|
|
and \tmp1, \tmp1, #PTRS_PER_PUD - 1 // PUD index
|
|
|
|
orr \tmp2, \tbl, #3 // PUD entry table type
|
|
|
|
str \tmp2, [\pud, \tmp1, lsl #3]
|
|
|
|
#else
|
|
|
|
mov \pud, \tbl
|
|
|
|
#endif
|
|
|
|
.endm
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Macro to populate the PGD (and possibily PUD) for the corresponding
|
|
|
|
* block entry in the next level (tbl) for the given virtual address.
|
|
|
|
*
|
|
|
|
* Preserves: pgd, virt
|
|
|
|
* Corrupts: tmp1, tmp2, tmp3
|
|
|
|
* Returns: tbl -> page where block mappings can be placed
|
|
|
|
* (changed to make room for pud with 4 levels, preserved otherwise)
|
|
|
|
*/
|
|
|
|
.macro create_pgd_entry, pgd, tbl, virt, tmp1, tmp2, tmp3
|
|
|
|
create_pud_entry \pgd, \tbl, \virt, \tmp3, \tmp1, \tmp2
|
2012-03-05 19:49:27 +08:00
|
|
|
lsr \tmp1, \virt, #PGDIR_SHIFT
|
|
|
|
and \tmp1, \tmp1, #PTRS_PER_PGD - 1 // PGD index
|
2014-05-12 17:40:51 +08:00
|
|
|
orr \tmp2, \tmp3, #3 // PGD entry table type
|
2012-03-05 19:49:27 +08:00
|
|
|
str \tmp2, [\pgd, \tmp1, lsl #3]
|
|
|
|
.endm
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Macro to populate block entries in the page table for the start..end
|
|
|
|
* virtual range (inclusive).
|
|
|
|
*
|
|
|
|
* Preserves: tbl, flags
|
|
|
|
* Corrupts: phys, start, end, pstate
|
|
|
|
*/
|
2014-02-17 20:03:25 +08:00
|
|
|
.macro create_block_map, tbl, flags, phys, start, end
|
2012-03-05 19:49:27 +08:00
|
|
|
lsr \phys, \phys, #BLOCK_SHIFT
|
|
|
|
lsr \start, \start, #BLOCK_SHIFT
|
|
|
|
and \start, \start, #PTRS_PER_PTE - 1 // table index
|
|
|
|
orr \phys, \flags, \phys, lsl #BLOCK_SHIFT // table entry
|
|
|
|
lsr \end, \end, #BLOCK_SHIFT
|
|
|
|
and \end, \end, #PTRS_PER_PTE - 1 // table end index
|
|
|
|
9999: str \phys, [\tbl, \start, lsl #3] // store the entry
|
|
|
|
add \start, \start, #1 // next entry
|
|
|
|
add \phys, \phys, #BLOCK_SIZE // next block
|
|
|
|
cmp \start, \end
|
|
|
|
b.ls 9999b
|
|
|
|
.endm
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Setup the initial page tables. We only setup the barest amount which is
|
|
|
|
* required to get the kernel running. The following sections are required:
|
|
|
|
* - identity mapping to enable the MMU (low address, TTBR0)
|
|
|
|
* - first few MB of the kernel linear mapping to jump to once the MMU has
|
|
|
|
* been enabled, including the FDT blob (TTBR1)
|
2014-04-08 06:39:52 +08:00
|
|
|
* - pgd entry for fixed mappings (TTBR1)
|
2012-03-05 19:49:27 +08:00
|
|
|
*/
|
|
|
|
__create_page_tables:
|
2014-06-24 23:51:35 +08:00
|
|
|
pgtbl x25, x26, x28 // idmap_pg_dir and swapper_pg_dir addresses
|
2014-03-27 02:25:55 +08:00
|
|
|
mov x27, lr
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Invalidate the idmap and swapper page tables to avoid potential
|
|
|
|
* dirty cache lines being evicted.
|
|
|
|
*/
|
|
|
|
mov x0, x25
|
|
|
|
add x1, x26, #SWAPPER_DIR_SIZE
|
|
|
|
bl __inval_cache_range
|
2012-03-05 19:49:27 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Clear the idmap and swapper page tables.
|
|
|
|
*/
|
|
|
|
mov x0, x25
|
|
|
|
add x6, x26, #SWAPPER_DIR_SIZE
|
|
|
|
1: stp xzr, xzr, [x0], #16
|
|
|
|
stp xzr, xzr, [x0], #16
|
|
|
|
stp xzr, xzr, [x0], #16
|
|
|
|
stp xzr, xzr, [x0], #16
|
|
|
|
cmp x0, x6
|
|
|
|
b.lo 1b
|
|
|
|
|
|
|
|
ldr x7, =MM_MMUFLAGS
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Create the identity mapping.
|
|
|
|
*/
|
|
|
|
add x0, x25, #PAGE_SIZE // section table address
|
2014-02-17 20:03:25 +08:00
|
|
|
ldr x3, =KERNEL_START
|
|
|
|
add x3, x3, x28 // __pa(KERNEL_START)
|
2014-05-12 17:40:51 +08:00
|
|
|
create_pgd_entry x25, x0, x3, x1, x5, x6
|
2014-02-17 20:03:25 +08:00
|
|
|
ldr x6, =KERNEL_END
|
|
|
|
mov x5, x3 // __pa(KERNEL_START)
|
|
|
|
add x6, x6, x28 // __pa(KERNEL_END)
|
|
|
|
create_block_map x0, x7, x3, x5, x6
|
2012-03-05 19:49:27 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Map the kernel image (starting with PHYS_OFFSET).
|
|
|
|
*/
|
|
|
|
add x0, x26, #PAGE_SIZE // section table address
|
|
|
|
mov x5, #PAGE_OFFSET
|
2014-05-12 17:40:51 +08:00
|
|
|
create_pgd_entry x26, x0, x5, x1, x3, x6
|
2014-02-17 20:03:25 +08:00
|
|
|
ldr x6, =KERNEL_END
|
2012-03-05 19:49:27 +08:00
|
|
|
mov x3, x24 // phys offset
|
|
|
|
create_block_map x0, x7, x3, x5, x6
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Map the FDT blob (maximum 2MB; must be within 512MB of
|
|
|
|
* PHYS_OFFSET).
|
|
|
|
*/
|
|
|
|
mov x3, x21 // FDT phys address
|
|
|
|
and x3, x3, #~((1 << 21) - 1) // 2MB aligned
|
|
|
|
mov x6, #PAGE_OFFSET
|
|
|
|
sub x5, x3, x24 // subtract PHYS_OFFSET
|
|
|
|
tst x5, #~((1 << 29) - 1) // within 512MB?
|
|
|
|
csel x21, xzr, x21, ne // zero the FDT pointer
|
|
|
|
b.ne 1f
|
|
|
|
add x5, x5, x6 // __va(FDT blob)
|
|
|
|
add x6, x5, #1 << 21 // 2MB for the FDT blob
|
|
|
|
sub x6, x6, #1 // inclusive range
|
|
|
|
create_block_map x0, x7, x3, x5, x6
|
|
|
|
1:
|
2014-03-27 02:25:55 +08:00
|
|
|
/*
|
|
|
|
* Since the page tables have been populated with non-cacheable
|
|
|
|
* accesses (MMU disabled), invalidate the idmap and swapper page
|
|
|
|
* tables again to remove any speculatively loaded cache lines.
|
|
|
|
*/
|
|
|
|
mov x0, x25
|
|
|
|
add x1, x26, #SWAPPER_DIR_SIZE
|
|
|
|
bl __inval_cache_range
|
|
|
|
|
|
|
|
mov lr, x27
|
2012-03-05 19:49:27 +08:00
|
|
|
ret
|
|
|
|
ENDPROC(__create_page_tables)
|
|
|
|
.ltorg
|
|
|
|
|
|
|
|
.align 3
|
|
|
|
.type __switch_data, %object
|
|
|
|
__switch_data:
|
|
|
|
.quad __mmap_switched
|
|
|
|
.quad __bss_start // x6
|
2014-06-24 23:51:35 +08:00
|
|
|
.quad __bss_stop // x7
|
2012-03-05 19:49:27 +08:00
|
|
|
.quad processor_id // x4
|
|
|
|
.quad __fdt_pointer // x5
|
|
|
|
.quad memstart_addr // x6
|
|
|
|
.quad init_thread_union + THREAD_START_SP // sp
|
|
|
|
|
|
|
|
/*
|
|
|
|
* The following fragment of code is executed with the MMU on in MMU mode, and
|
|
|
|
* uses absolute addresses; this is not position independent.
|
|
|
|
*/
|
|
|
|
__mmap_switched:
|
|
|
|
adr x3, __switch_data + 8
|
|
|
|
|
|
|
|
ldp x6, x7, [x3], #16
|
|
|
|
1: cmp x6, x7
|
|
|
|
b.hs 2f
|
|
|
|
str xzr, [x6], #8 // Clear BSS
|
|
|
|
b 1b
|
|
|
|
2:
|
|
|
|
ldp x4, x5, [x3], #16
|
|
|
|
ldr x6, [x3], #8
|
|
|
|
ldr x16, [x3]
|
|
|
|
mov sp, x16
|
|
|
|
str x22, [x4] // Save processor ID
|
|
|
|
str x21, [x5] // Save FDT pointer
|
|
|
|
str x24, [x6] // Save PHYS_OFFSET
|
|
|
|
mov x29, #0
|
|
|
|
b start_kernel
|
|
|
|
ENDPROC(__mmap_switched)
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Exception handling. Something went wrong and we can't proceed. We ought to
|
|
|
|
* tell the user, but since we don't have any guarantee that we're even
|
|
|
|
* running on the right architecture, we do virtually nothing.
|
|
|
|
*/
|
|
|
|
__error_p:
|
|
|
|
ENDPROC(__error_p)
|
|
|
|
|
|
|
|
__error:
|
|
|
|
1: nop
|
|
|
|
b 1b
|
|
|
|
ENDPROC(__error)
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This function gets the processor ID in w0 and searches the cpu_table[] for
|
|
|
|
* a match. It returns a pointer to the struct cpu_info it found. The
|
|
|
|
* cpu_table[] must end with an empty (all zeros) structure.
|
|
|
|
*
|
|
|
|
* This routine can be called via C code and it needs to work with the MMU
|
|
|
|
* both disabled and enabled (the offset is calculated automatically).
|
|
|
|
*/
|
|
|
|
ENTRY(lookup_processor_type)
|
|
|
|
adr x1, __lookup_processor_type_data
|
|
|
|
ldp x2, x3, [x1]
|
|
|
|
sub x1, x1, x2 // get offset between VA and PA
|
|
|
|
add x3, x3, x1 // convert VA to PA
|
|
|
|
1:
|
|
|
|
ldp w5, w6, [x3] // load cpu_id_val and cpu_id_mask
|
|
|
|
cbz w5, 2f // end of list?
|
|
|
|
and w6, w6, w0
|
|
|
|
cmp w5, w6
|
|
|
|
b.eq 3f
|
|
|
|
add x3, x3, #CPU_INFO_SZ
|
|
|
|
b 1b
|
|
|
|
2:
|
|
|
|
mov x3, #0 // unknown processor
|
|
|
|
3:
|
|
|
|
mov x0, x3
|
|
|
|
ret
|
|
|
|
ENDPROC(lookup_processor_type)
|
|
|
|
|
|
|
|
.align 3
|
|
|
|
.type __lookup_processor_type_data, %object
|
|
|
|
__lookup_processor_type_data:
|
|
|
|
.quad .
|
|
|
|
.quad cpu_table
|
|
|
|
.size __lookup_processor_type_data, . - __lookup_processor_type_data
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Determine validity of the x21 FDT pointer.
|
|
|
|
* The dtb must be 8-byte aligned and live in the first 512M of memory.
|
|
|
|
*/
|
|
|
|
__vet_fdt:
|
|
|
|
tst x21, #0x7
|
|
|
|
b.ne 1f
|
|
|
|
cmp x21, x24
|
|
|
|
b.lt 1f
|
|
|
|
mov x0, #(1 << 29)
|
|
|
|
add x0, x0, x24
|
|
|
|
cmp x21, x0
|
|
|
|
b.ge 1f
|
|
|
|
ret
|
|
|
|
1:
|
|
|
|
mov x21, #0
|
|
|
|
ret
|
|
|
|
ENDPROC(__vet_fdt)
|