diff options
Diffstat (limited to 'arch/x86_64/kernel/trampoline.S')
| -rw-r--r-- | arch/x86_64/kernel/trampoline.S | 123 |
1 file changed, 109 insertions, 14 deletions
diff --git a/arch/x86_64/kernel/trampoline.S b/arch/x86_64/kernel/trampoline.S index c79b99a9e2f6..e7e2764c461b 100644 --- a/arch/x86_64/kernel/trampoline.S +++ b/arch/x86_64/kernel/trampoline.S | |||
| @@ -3,6 +3,7 @@ | |||
| 3 | * Trampoline.S Derived from Setup.S by Linus Torvalds | 3 | * Trampoline.S Derived from Setup.S by Linus Torvalds |
| 4 | * | 4 | * |
| 5 | * 4 Jan 1997 Michael Chastain: changed to gnu as. | 5 | * 4 Jan 1997 Michael Chastain: changed to gnu as. |
| 6 | * 15 Sept 2005 Eric Biederman: 64bit PIC support | ||
| 6 | * | 7 | * |
| 7 | * Entry: CS:IP point to the start of our code, we are | 8 | * Entry: CS:IP point to the start of our code, we are |
| 8 | * in real mode with no stack, but the rest of the | 9 | * in real mode with no stack, but the rest of the |
| @@ -17,15 +18,20 @@ | |||
| 17 | * and IP is zero. Thus, data addresses need to be absolute | 18 | * and IP is zero. Thus, data addresses need to be absolute |
| 18 | * (no relocation) and are taken with regard to r_base. | 19 | * (no relocation) and are taken with regard to r_base. |
| 19 | * | 20 | * |
| 21 | * With the addition of trampoline_level4_pgt this code can | ||
| 22 | * now enter a 64bit kernel that lives at arbitrary 64bit | ||
| 23 | * physical addresses. | ||
| 24 | * | ||
| 20 | * If you work on this file, check the object module with objdump | 25 | * If you work on this file, check the object module with objdump |
| 21 | * --full-contents --reloc to make sure there are no relocation | 26 | * --full-contents --reloc to make sure there are no relocation |
| 22 | * entries. For the GDT entry we do hand relocation in smpboot.c | 27 | * entries. |
| 23 | * because of 64bit linker limitations. | ||
| 24 | */ | 28 | */ |
| 25 | 29 | ||
| 26 | #include <linux/linkage.h> | 30 | #include <linux/linkage.h> |
| 27 | #include <asm/segment.h> | 31 | #include <asm/pgtable.h> |
| 28 | #include <asm/page.h> | 32 | #include <asm/page.h> |
| 33 | #include <asm/msr.h> | ||
| 34 | #include <asm/segment.h> | ||
| 29 | 35 | ||
| 30 | .data | 36 | .data |
| 31 | 37 | ||
| @@ -33,15 +39,33 @@ | |||
| 33 | 39 | ||
| 34 | ENTRY(trampoline_data) | 40 | ENTRY(trampoline_data) |
| 35 | r_base = . | 41 | r_base = . |
| 42 | cli # We should be safe anyway | ||
| 36 | wbinvd | 43 | wbinvd |
| 37 | mov %cs, %ax # Code and data in the same place | 44 | mov %cs, %ax # Code and data in the same place |
| 38 | mov %ax, %ds | 45 | mov %ax, %ds |
| 46 | mov %ax, %es | ||
| 47 | mov %ax, %ss | ||
| 39 | 48 | ||
| 40 | cli # We should be safe anyway | ||
| 41 | 49 | ||
| 42 | movl $0xA5A5A5A5, trampoline_data - r_base | 50 | movl $0xA5A5A5A5, trampoline_data - r_base |
| 43 | # write marker so the master knows we're running | 51 | # write marker so the master knows we're running |
| 44 | 52 | ||
| 53 | # Setup stack | ||
| 54 | movw $(trampoline_stack_end - r_base), %sp | ||
| 55 | |||
| 56 | call verify_cpu # Verify the cpu supports long mode | ||
| 57 | testl %eax, %eax # Check for return code | ||
| 58 | jnz no_longmode | ||
| 59 | |||
| 60 | mov %cs, %ax | ||
| 61 | movzx %ax, %esi # Find the 32bit trampoline location | ||
| 62 | shll $4, %esi | ||
| 63 | |||
| 64 | # Fixup the vectors | ||
| 65 | addl %esi, startup_32_vector - r_base | ||
| 66 | addl %esi, startup_64_vector - r_base | ||
| 67 | addl %esi, tgdt + 2 - r_base # Fixup the gdt pointer | ||
| 68 | |||
| 45 | /* | 69 | /* |
| 46 | * GDT tables in non default location kernel can be beyond 16MB and | 70 | * GDT tables in non default location kernel can be beyond 16MB and |
| 47 | * lgdt will not be able to load the address as in real mode default | 71 | * lgdt will not be able to load the address as in real mode default |
| @@ -49,23 +73,94 @@ r_base = . | |||
| 49 | * to 32 bit. | 73 | * to 32 bit. |
| 50 | */ | 74 | */ |
| 51 | 75 | ||
| 52 | lidtl idt_48 - r_base # load idt with 0, 0 | 76 | lidtl tidt - r_base # load idt with 0, 0 |
| 53 | lgdtl gdt_48 - r_base # load gdt with whatever is appropriate | 77 | lgdtl tgdt - r_base # load gdt with whatever is appropriate |
| 54 | 78 | ||
| 55 | xor %ax, %ax | 79 | xor %ax, %ax |
| 56 | inc %ax # protected mode (PE) bit | 80 | inc %ax # protected mode (PE) bit |
| 57 | lmsw %ax # into protected mode | 81 | lmsw %ax # into protected mode |
| 58 | # flaush prefetch and jump to startup_32 in arch/x86_64/kernel/head.S | 82 | |
| 59 | ljmpl $__KERNEL32_CS, $(startup_32-__START_KERNEL_map) | 83 | # flush prefetch and jump to startup_32 |
| 84 | ljmpl *(startup_32_vector - r_base) | ||
| 85 | |||
| 86 | .code32 | ||
| 87 | .balign 4 | ||
| 88 | startup_32: | ||
| 89 | movl $__KERNEL_DS, %eax # Initialize the %ds segment register | ||
| 90 | movl %eax, %ds | ||
| 91 | |||
| 92 | xorl %eax, %eax | ||
| 93 | btsl $5, %eax # Enable PAE mode | ||
| 94 | movl %eax, %cr4 | ||
| 95 | |||
| 96 | # Setup trampoline 4 level pagetables | ||
| 97 | leal (trampoline_level4_pgt - r_base)(%esi), %eax | ||
| 98 | movl %eax, %cr3 | ||
| 99 | |||
| 100 | movl $MSR_EFER, %ecx | ||
| 101 | movl $(1 << _EFER_LME), %eax # Enable Long Mode | ||
| 102 | xorl %edx, %edx | ||
| 103 | wrmsr | ||
| 104 | |||
| 105 | xorl %eax, %eax | ||
| 106 | btsl $31, %eax # Enable paging and in turn activate Long Mode | ||
| 107 | btsl $0, %eax # Enable protected mode | ||
| 108 | movl %eax, %cr0 | ||
| 109 | |||
| 110 | /* | ||
| 111 | * At this point we're in long mode but in 32bit compatibility mode | ||
| 112 | * with EFER.LME = 1, CS.L = 0, CS.D = 1 (and in turn | ||
| 113 | * EFER.LMA = 1). Now we want to jump into 64bit mode; to do that we use | ||
| 114 | * the new gdt/idt that has __KERNEL_CS with CS.L = 1. | ||
| 115 | */ | ||
| 116 | ljmp *(startup_64_vector - r_base)(%esi) | ||
| 117 | |||
| 118 | .code64 | ||
| 119 | .balign 4 | ||
| 120 | startup_64: | ||
| 121 | # Now jump into the kernel using virtual addresses | ||
| 122 | movq $secondary_startup_64, %rax | ||
| 123 | jmp *%rax | ||
| 124 | |||
| 125 | .code16 | ||
| 126 | no_longmode: | ||
| 127 | hlt | ||
| 128 | jmp no_longmode | ||
| 129 | #include "verify_cpu.S" | ||
| 60 | 130 | ||
| 61 | # Careful: these need to be in the same 64K segment as the above; | 131 | # Careful: these need to be in the same 64K segment as the above; |
| 62 | idt_48: | 132 | tidt: |
| 63 | .word 0 # idt limit = 0 | 133 | .word 0 # idt limit = 0 |
| 64 | .word 0, 0 # idt base = 0L | 134 | .word 0, 0 # idt base = 0L |
| 65 | 135 | ||
| 66 | gdt_48: | 136 | # Duplicate the global descriptor table |
| 67 | .short GDT_ENTRIES*8 - 1 # gdt limit | 137 | # so the kernel can live anywhere |
| 68 | .long cpu_gdt_table-__START_KERNEL_map | 138 | .balign 4 |
| 139 | tgdt: | ||
| 140 | .short tgdt_end - tgdt # gdt limit | ||
| 141 | .long tgdt - r_base | ||
| 142 | .short 0 | ||
| 143 | .quad 0x00cf9b000000ffff # __KERNEL32_CS | ||
| 144 | .quad 0x00af9b000000ffff # __KERNEL_CS | ||
| 145 | .quad 0x00cf93000000ffff # __KERNEL_DS | ||
| 146 | tgdt_end: | ||
| 147 | |||
| 148 | .balign 4 | ||
| 149 | startup_32_vector: | ||
| 150 | .long startup_32 - r_base | ||
| 151 | .word __KERNEL32_CS, 0 | ||
| 152 | |||
| 153 | .balign 4 | ||
| 154 | startup_64_vector: | ||
| 155 | .long startup_64 - r_base | ||
| 156 | .word __KERNEL_CS, 0 | ||
| 157 | |||
| 158 | trampoline_stack: | ||
| 159 | .org 0x1000 | ||
| 160 | trampoline_stack_end: | ||
| 161 | ENTRY(trampoline_level4_pgt) | ||
| 162 | .quad level3_ident_pgt - __START_KERNEL_map + _KERNPG_TABLE | ||
| 163 | .fill 510,8,0 | ||
| 164 | .quad level3_kernel_pgt - __START_KERNEL_map + _KERNPG_TABLE | ||
| 69 | 165 | ||
| 70 | .globl trampoline_end | 166 | ENTRY(trampoline_end) |
| 71 | trampoline_end: | ||
