Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* |
| 2 | * |
| 3 | * Trampoline.S Derived from Setup.S by Linus Torvalds |
| 4 | * |
| 5 | * 4 Jan 1997 Michael Chastain: changed to gnu as. |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 6 | * 15 Sept 2005 Eric Biederman: 64bit PIC support |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 7 | * |
| 8 | * Entry: CS:IP point to the start of our code, we are |
| 9 | * in real mode with no stack, but we have the rest of the |
| 10 | * trampoline page to make our stack; everything else |
| 11 | * is a mystery. |
| 12 | * |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 13 | * On entry to trampoline_data, the processor is in real mode |
| 14 | * with 16-bit addressing and 16-bit data. CS has some value |
| 15 | * and IP is zero. Thus, data addresses need to be absolute |
| 16 | * (no relocation) and are taken with regard to r_base. |
| 17 | * |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 18 | * With the addition of trampoline_level4_pgt this code can |
| 19 | * now enter a 64bit kernel that lives at arbitrary 64bit |
| 20 | * physical addresses. |
| 21 | * |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 22 | * If you work on this file, check the object module with objdump |
| 23 | * --full-contents --reloc to make sure there are no relocation |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 24 | * entries. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 25 | */ |
| 26 | |
| 27 | #include <linux/linkage.h> |
Jan Beulich | 5f68563 | 2009-09-04 09:16:22 +0100 | [diff] [blame] | 28 | #include <linux/init.h> |
Jeremy Fitzhardinge | 0341c14 | 2009-02-13 11:14:01 -0800 | [diff] [blame] | 29 | #include <asm/pgtable_types.h> |
| 30 | #include <asm/page_types.h> |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 31 | #include <asm/msr.h> |
| 32 | #include <asm/segment.h> |
Cyrill Gorcunov | 0a1e886 | 2009-01-28 23:21:25 +0300 | [diff] [blame] | 33 | #include <asm/processor-flags.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 34 | |
Jan Beulich | 7a4b7e5 | 2009-10-06 16:32:43 +0100 | [diff] [blame] | 35 | #ifdef CONFIG_ACPI_SLEEP |
| 36 | .section .rodata, "a", @progbits |
| 37 | #else |
Jan Beulich | 5f68563 | 2009-09-04 09:16:22 +0100 | [diff] [blame] | 38 | /* We can free up the trampoline after bootup if cpu hotplug is not supported. */ |
| 39 | __CPUINITRODATA |
Jan Beulich | 7a4b7e5 | 2009-10-06 16:32:43 +0100 | [diff] [blame] | 40 | #endif |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 41 | .code16 |
| 42 | |
| 43 | ENTRY(trampoline_data) /* real-mode entry point: 16-bit code, reached with IP = 0 */ |
| 44 | r_base = . /* data offsets below are written as (symbol - r_base) */ |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 45 | cli # We should be safe anyway |
Cyrill Gorcunov | 0a1e886 | 2009-01-28 23:21:25 +0300 | [diff] [blame] | 46 | wbinvd /* write back and invalidate the caches */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 47 | mov %cs, %ax # Code and data in the same place |
| 48 | mov %ax, %ds |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 49 | mov %ax, %es |
| 50 | mov %ax, %ss |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 51 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 52 | /* The store below lands at offset 0, on top of entry instructions that have already executed */ |
| 53 | movl $0xA5A5A5A5, trampoline_data - r_base |
| 54 | # write marker so the master knows we're running |
| 55 | |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 56 | # Setup stack |
| 57 | movw $(trampoline_stack_end - r_base), %sp |
| 58 | |
| 59 | call verify_cpu # Verify the cpu supports long mode |
Vivek Goyal | a4831e0 | 2007-05-02 19:27:08 +0200 | [diff] [blame] | 60 | testl %eax, %eax # Check for return code |
| 61 | jnz no_longmode /* nonzero return: go halt in no_longmode */ |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 62 | |
| 63 | mov %cs, %ax |
| 64 | movzx %ax, %esi # Find the 32bit trampoline location |
| 65 | shll $4, %esi /* %esi = CS << 4, the linear address of r_base */ |
| 66 | |
| 67 | # Fixup the vectors |
| 68 | addl %esi, startup_32_vector - r_base |
| 69 | addl %esi, startup_64_vector - r_base |
| 70 | addl %esi, tgdt + 2 - r_base # Fixup the gdt pointer |
| 71 | |
Vivek Goyal | 983d5db | 2006-01-12 03:35:20 +0100 | [diff] [blame] | 72 | /* |
| 73 | * A GDT that lives in a non-default location can be beyond 16MB, and |
| 74 | * lgdt would not be able to load its address because the default |
| 75 | * operand size in real mode is 16 bits. Use lgdtl instead to force |
| 76 | * the operand size to 32 bits. |
| 77 | */ |
| 78 | |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 79 | lidtl tidt - r_base # load idt with 0, 0 |
| 80 | lgdtl tgdt - r_base # load gdt with whatever is appropriate |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 81 | |
Cyrill Gorcunov | 0a1e886 | 2009-01-28 23:21:25 +0300 | [diff] [blame] | 82 | mov $X86_CR0_PE, %ax # protected mode (PE) bit |
| 83 | lmsw %ax # into protected mode |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 84 | |
| 85 | # flush prefetch and jump to startup_32 |
| 86 | ljmpl *(startup_32_vector - r_base) |
| 87 | |
| 88 | .code32 |
| 89 | .balign 4 |
| 90 | startup_32: /* 32-bit protected mode; %esi still holds the trampoline's linear base */ |
| 91 | movl $__KERNEL_DS, %eax # Initialize the %ds segment register |
| 92 | movl %eax, %ds |
| 93 | |
Cyrill Gorcunov | 0a1e886 | 2009-01-28 23:21:25 +0300 | [diff] [blame] | 94 | movl $X86_CR4_PAE, %eax |
| 95 | movl %eax, %cr4 # Enable PAE mode |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 96 | |
| 97 | # Setup trampoline 4 level pagetables |
| 98 | leal (trampoline_level4_pgt - r_base)(%esi), %eax |
| 99 | movl %eax, %cr3 /* CR3 = run-time address of trampoline_level4_pgt */ |
| 100 | |
| 101 | movl $MSR_EFER, %ecx |
| 102 | movl $(1 << _EFER_LME), %eax # Enable Long Mode |
| 103 | xorl %edx, %edx /* upper 32 bits of the value written by wrmsr are zero */ |
| 104 | wrmsr /* MSR[%ecx] = %edx:%eax */ |
| 105 | |
Cyrill Gorcunov | 0a1e886 | 2009-01-28 23:21:25 +0300 | [diff] [blame] | 106 | # Enable paging and in turn activate Long Mode |
| 107 | # Enable protected mode |
| 108 | movl $(X86_CR0_PG | X86_CR0_PE), %eax |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 109 | movl %eax, %cr0 |
| 110 | |
| 111 | /* |
| 112 | * At this point we're in long mode but in 32bit compatibility mode |
| 113 | * with EFER.LME = 1, CS.L = 0, CS.D = 1 (and in turn |
| 114 | * EFER.LMA = 1). Now we want to jump in 64bit mode, to do that we use |
| 115 | * the new gdt/idt that has __KERNEL_CS with CS.L = 1. |
| 116 | */ |
| 117 | ljmp *(startup_64_vector - r_base)(%esi) /* vector is addressed through the linear base in %esi */ |
| 118 | |
| 119 | .code64 |
| 120 | .balign 4 |
| 121 | startup_64: /* reached through startup_64_vector, i.e. with CS = __KERNEL_CS */ |
| 122 | # Now jump into the kernel using virtual addresses |
| 123 | movq $secondary_startup_64, %rax /* load the full 64-bit address of secondary_startup_64 */ |
| 124 | jmp *%rax |
| 125 | |
| 126 | .code16 |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 127 | no_longmode: /* target of the jnz after verify_cpu returned nonzero: park this CPU */ |
| 128 | hlt |
| 129 | jmp no_longmode /* halt again if execution ever resumes after hlt */ |
Thomas Gleixner | e0a84f6 | 2007-10-11 11:15:19 +0200 | [diff] [blame] | 130 | #include "verify_cpu_64.S" |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 131 | |
| 132 | # Careful these need to be in the same 64K segment as the above; |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 133 | tidt: /* 6-byte operand for lidtl: 16-bit limit followed by 32-bit base */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 134 | .word 0 # idt limit = 0 |
| 135 | .word 0, 0 # idt base = 0L |
| 136 | |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 137 | # Duplicate the global descriptor table |
| 138 | # so the kernel can live anywhere |
| 139 | .balign 4 |
| 140 | tgdt: /* the first 8 bytes are the lgdtl operand and fill the otherwise unused null-descriptor slot */ |
| 141 | .short tgdt_end - tgdt - 1 # gdt limit = table size - 1 (offset of the last valid byte) |
| 142 | .long tgdt - r_base /* base; trampoline_data adds the load address at run time */ |
| 143 | .short 0 /* pads the pseudo-descriptor to 8 bytes */ |
| 144 | .quad 0x00cf9b000000ffff # __KERNEL32_CS |
| 145 | .quad 0x00af9b000000ffff # __KERNEL_CS |
| 146 | .quad 0x00cf93000000ffff # __KERNEL_DS |
| 147 | tgdt_end: |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 148 | |
Vivek Goyal | 90b1c20 | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 149 | .balign 4 |
| 150 | startup_32_vector: /* far pointer (32-bit offset, 16-bit selector) used by the ljmpl in trampoline_data */ |
| 151 | .long startup_32 - r_base /* trampoline_data adds the load address at run time */ |
| 152 | .word __KERNEL32_CS, 0 |
| 153 | |
| 154 | .balign 4 |
| 155 | startup_64_vector: /* far pointer used by the ljmp at the end of startup_32 */ |
| 156 | .long startup_64 - r_base /* trampoline_data adds the load address at run time */ |
| 157 | .word __KERNEL_CS, 0 |
| 158 | |
| 159 | trampoline_stack: |
| 160 | .org 0x1000 /* pad up to offset 0x1000; %sp is initialised to trampoline_stack_end */ |
| 161 | trampoline_stack_end: |
| 162 | ENTRY(trampoline_level4_pgt) /* 512 eight-byte entries; loaded into CR3 by startup_32 */ |
| 163 | .quad level3_ident_pgt - __START_KERNEL_map + _KERNPG_TABLE /* entry 0 */ |
| 164 | .fill 510,8,0 /* entries 1..510 are zero */ |
| 165 | .quad level3_kernel_pgt - __START_KERNEL_map + _KERNPG_TABLE /* entry 511 */ |
| 166 | |
| 167 | ENTRY(trampoline_end) |