diff options
author | Vivek Goyal <vgoyal@in.ibm.com> | 2007-05-02 13:27:07 -0400 |
---|---|---|
committer | Andi Kleen <andi@basil.nowhere.org> | 2007-05-02 13:27:07 -0400 |
commit | 275f55170ec2b5d777b070cb8ab9e5d58e65a2a8 (patch) | |
tree | b1124f3cac6975a9ef2a5a65849f9c68e71c1eab | |
parent | 7db681d7e4038ad205b5face5cf7f7815633e1b5 (diff) |
[PATCH] x86-64: wakeup.S misc cleanups
o Various cleanups. One of the main purpose of cleanups is that make
wakeup.S as close as possible to trampoline.S.
o Following are the changes
- Indentations for comments.
- Changed the gdt table to compact form and to resemble the
one in trampoline.S
- Take the jump to 32bit from real mode using ljmpl. Makes code
more readable.
- After enabling long mode, directly take a long jump for 64bit
mode. No need to take an extra jump to "reach_comaptibility_mode"
- Stack is not used after real mode. So don't load stack in
32 bit mode.
- No need to enable PGE here.
- No need to do extra EFER read, anyway we trash the read contents.
- No need to enable system call (EFER_SCE). Anyway it will be
enabled when original EFER is restored.
- No need to set MP, ET, NE, WP, AM bits in cr0. Very soon we will
reload the original cr0 while restroing the processor state.
Signed-off-by: Eric W. Biederman <ebiederm@xmission.com>
Signed-off-by: Vivek Goyal <vgoyal@in.ibm.com>
Signed-off-by: Andi Kleen <ak@suse.de>
-rw-r--r-- | arch/x86_64/kernel/acpi/wakeup.S | 112 |
1 files changed, 40 insertions, 72 deletions
diff --git a/arch/x86_64/kernel/acpi/wakeup.S b/arch/x86_64/kernel/acpi/wakeup.S index 17dbeff64eef..bd4c6f1a6f32 100644 --- a/arch/x86_64/kernel/acpi/wakeup.S +++ b/arch/x86_64/kernel/acpi/wakeup.S | |||
@@ -30,11 +30,12 @@ wakeup_code: | |||
30 | cld | 30 | cld |
31 | # setup data segment | 31 | # setup data segment |
32 | movw %cs, %ax | 32 | movw %cs, %ax |
33 | movw %ax, %ds # Make ds:0 point to wakeup_start | 33 | movw %ax, %ds # Make ds:0 point to wakeup_start |
34 | movw %ax, %ss | 34 | movw %ax, %ss |
35 | mov $(wakeup_stack - wakeup_code), %sp # Private stack is needed for ASUS board | 35 | # Private stack is needed for ASUS board |
36 | mov $(wakeup_stack - wakeup_code), %sp | ||
36 | 37 | ||
37 | pushl $0 # Kill any dangerous flags | 38 | pushl $0 # Kill any dangerous flags |
38 | popfl | 39 | popfl |
39 | 40 | ||
40 | movl real_magic - wakeup_code, %eax | 41 | movl real_magic - wakeup_code, %eax |
@@ -45,7 +46,7 @@ wakeup_code: | |||
45 | jz 1f | 46 | jz 1f |
46 | lcall $0xc000,$3 | 47 | lcall $0xc000,$3 |
47 | movw %cs, %ax | 48 | movw %cs, %ax |
48 | movw %ax, %ds # Bios might have played with that | 49 | movw %ax, %ds # Bios might have played with that |
49 | movw %ax, %ss | 50 | movw %ax, %ss |
50 | 1: | 51 | 1: |
51 | 52 | ||
@@ -75,9 +76,12 @@ wakeup_code: | |||
75 | jmp 1f | 76 | jmp 1f |
76 | 1: | 77 | 1: |
77 | 78 | ||
78 | .byte 0x66, 0xea # prefix + jmpi-opcode | 79 | ljmpl *(wakeup_32_vector - wakeup_code) |
79 | .long wakeup_32 - __START_KERNEL_map | 80 | |
80 | .word __KERNEL_CS | 81 | .balign 4 |
82 | wakeup_32_vector: | ||
83 | .long wakeup_32 - __START_KERNEL_map | ||
84 | .word __KERNEL32_CS, 0 | ||
81 | 85 | ||
82 | .code32 | 86 | .code32 |
83 | wakeup_32: | 87 | wakeup_32: |
@@ -96,65 +100,50 @@ wakeup_32: | |||
96 | jnc bogus_cpu | 100 | jnc bogus_cpu |
97 | movl %edx,%edi | 101 | movl %edx,%edi |
98 | 102 | ||
99 | movw $__KERNEL_DS, %ax | 103 | movl $__KERNEL_DS, %eax |
100 | movw %ax, %ds | 104 | movl %eax, %ds |
101 | movw %ax, %es | ||
102 | movw %ax, %fs | ||
103 | movw %ax, %gs | ||
104 | 105 | ||
105 | movw $__KERNEL_DS, %ax | ||
106 | movw %ax, %ss | ||
107 | |||
108 | mov $(wakeup_stack - __START_KERNEL_map), %esp | ||
109 | movl saved_magic - __START_KERNEL_map, %eax | 106 | movl saved_magic - __START_KERNEL_map, %eax |
110 | cmpl $0x9abcdef0, %eax | 107 | cmpl $0x9abcdef0, %eax |
111 | jne bogus_32_magic | 108 | jne bogus_32_magic |
112 | 109 | ||
110 | movw $0x0e00 + 'i', %ds:(0xb8012) | ||
111 | movb $0xa8, %al ; outb %al, $0x80; | ||
112 | |||
113 | /* | 113 | /* |
114 | * Prepare for entering 64bits mode | 114 | * Prepare for entering 64bits mode |
115 | */ | 115 | */ |
116 | 116 | ||
117 | /* Enable PAE mode and PGE */ | 117 | /* Enable PAE */ |
118 | xorl %eax, %eax | 118 | xorl %eax, %eax |
119 | btsl $5, %eax | 119 | btsl $5, %eax |
120 | btsl $7, %eax | ||
121 | movl %eax, %cr4 | 120 | movl %eax, %cr4 |
122 | 121 | ||
123 | /* Setup early boot stage 4 level pagetables */ | 122 | /* Setup early boot stage 4 level pagetables */ |
124 | movl $(wakeup_level4_pgt - __START_KERNEL_map), %eax | 123 | movl $(wakeup_level4_pgt - __START_KERNEL_map), %eax |
125 | movl %eax, %cr3 | 124 | movl %eax, %cr3 |
126 | 125 | ||
127 | /* Setup EFER (Extended Feature Enable Register) */ | ||
128 | movl $MSR_EFER, %ecx | ||
129 | rdmsr | ||
130 | /* Fool rdmsr and reset %eax to avoid dependences */ | ||
131 | xorl %eax, %eax | ||
132 | /* Enable Long Mode */ | 126 | /* Enable Long Mode */ |
127 | xorl %eax, %eax | ||
133 | btsl $_EFER_LME, %eax | 128 | btsl $_EFER_LME, %eax |
134 | /* Enable System Call */ | ||
135 | btsl $_EFER_SCE, %eax | ||
136 | 129 | ||
137 | /* No Execute supported? */ | 130 | /* No Execute supported? */ |
138 | btl $20,%edi | 131 | btl $20,%edi |
139 | jnc 1f | 132 | jnc 1f |
140 | btsl $_EFER_NX, %eax | 133 | btsl $_EFER_NX, %eax |
141 | 1: | ||
142 | 134 | ||
143 | /* Make changes effective */ | 135 | /* Make changes effective */ |
136 | 1: movl $MSR_EFER, %ecx | ||
137 | xorl %edx, %edx | ||
144 | wrmsr | 138 | wrmsr |
145 | wbinvd | ||
146 | 139 | ||
147 | xorl %eax, %eax | 140 | xorl %eax, %eax |
148 | btsl $31, %eax /* Enable paging and in turn activate Long Mode */ | 141 | btsl $31, %eax /* Enable paging and in turn activate Long Mode */ |
149 | btsl $0, %eax /* Enable protected mode */ | 142 | btsl $0, %eax /* Enable protected mode */ |
150 | btsl $1, %eax /* Enable MP */ | ||
151 | btsl $4, %eax /* Enable ET */ | ||
152 | btsl $5, %eax /* Enable NE */ | ||
153 | btsl $16, %eax /* Enable WP */ | ||
154 | btsl $18, %eax /* Enable AM */ | ||
155 | 143 | ||
156 | /* Make changes effective */ | 144 | /* Make changes effective */ |
157 | movl %eax, %cr0 | 145 | movl %eax, %cr0 |
146 | |||
158 | /* At this point: | 147 | /* At this point: |
159 | CR4.PAE must be 1 | 148 | CR4.PAE must be 1 |
160 | CS.L must be 0 | 149 | CS.L must be 0 |
@@ -162,11 +151,6 @@ wakeup_32: | |||
162 | Next instruction must be a branch | 151 | Next instruction must be a branch |
163 | This must be on identity-mapped page | 152 | This must be on identity-mapped page |
164 | */ | 153 | */ |
165 | jmp reach_compatibility_mode | ||
166 | reach_compatibility_mode: | ||
167 | movw $0x0e00 + 'i', %ds:(0xb8012) | ||
168 | movb $0xa8, %al ; outb %al, $0x80; | ||
169 | |||
170 | /* | 154 | /* |
171 | * At this point we're in long mode but in 32bit compatibility mode | 155 | * At this point we're in long mode but in 32bit compatibility mode |
172 | * with EFER.LME = 1, CS.L = 0, CS.D = 1 (and in turn | 156 | * with EFER.LME = 1, CS.L = 0, CS.D = 1 (and in turn |
@@ -174,24 +158,19 @@ reach_compatibility_mode: | |||
174 | * the new gdt/idt that has __KERNEL_CS with CS.L = 1. | 158 | * the new gdt/idt that has __KERNEL_CS with CS.L = 1. |
175 | */ | 159 | */ |
176 | 160 | ||
177 | movw $0x0e00 + 'n', %ds:(0xb8014) | ||
178 | movb $0xa9, %al ; outb %al, $0x80 | ||
179 | |||
180 | /* Load new GDT with the 64bit segment using 32bit descriptor */ | ||
181 | movl $(pGDT32 - __START_KERNEL_map), %eax | ||
182 | lgdt (%eax) | ||
183 | |||
184 | movl $(wakeup_jumpvector - __START_KERNEL_map), %eax | ||
185 | /* Finally jump in 64bit mode */ | 161 | /* Finally jump in 64bit mode */ |
186 | ljmp *(%eax) | 162 | ljmp *(wakeup_long64_vector - __START_KERNEL_map) |
187 | 163 | ||
188 | wakeup_jumpvector: | 164 | .balign 4 |
189 | .long wakeup_long64 - __START_KERNEL_map | 165 | wakeup_long64_vector: |
190 | .word __KERNEL_CS | 166 | .long wakeup_long64 - __START_KERNEL_map |
167 | .word __KERNEL_CS, 0 | ||
191 | 168 | ||
192 | .code64 | 169 | .code64 |
193 | 170 | ||
194 | /* Hooray, we are in Long 64-bit mode (but still running in low memory) */ | 171 | /* Hooray, we are in Long 64-bit mode (but still running in |
172 | * low memory) | ||
173 | */ | ||
195 | wakeup_long64: | 174 | wakeup_long64: |
196 | /* | 175 | /* |
197 | * We must switch to a new descriptor in kernel space for the GDT | 176 | * We must switch to a new descriptor in kernel space for the GDT |
@@ -201,6 +180,9 @@ wakeup_long64: | |||
201 | */ | 180 | */ |
202 | lgdt cpu_gdt_descr - __START_KERNEL_map | 181 | lgdt cpu_gdt_descr - __START_KERNEL_map |
203 | 182 | ||
183 | movw $0x0e00 + 'n', %ds:(0xb8014) | ||
184 | movb $0xa9, %al ; outb %al, $0x80 | ||
185 | |||
204 | movw $0x0e00 + 'u', %ds:(0xb8016) | 186 | movw $0x0e00 + 'u', %ds:(0xb8016) |
205 | 187 | ||
206 | nop | 188 | nop |
@@ -227,33 +209,19 @@ wakeup_long64: | |||
227 | 209 | ||
228 | .align 64 | 210 | .align 64 |
229 | gdta: | 211 | gdta: |
212 | /* Its good to keep gdt in sync with one in trampoline.S */ | ||
230 | .word 0, 0, 0, 0 # dummy | 213 | .word 0, 0, 0, 0 # dummy |
231 | 214 | /* ??? Why I need the accessed bit set in order for this to work? */ | |
232 | .word 0, 0, 0, 0 # unused | 215 | .quad 0x00cf9b000000ffff # __KERNEL32_CS |
233 | 216 | .quad 0x00af9b000000ffff # __KERNEL_CS | |
234 | .word 0xFFFF # 4Gb - (0x100000*0x1000 = 4Gb) | 217 | .quad 0x00cf93000000ffff # __KERNEL_DS |
235 | .word 0 # base address = 0 | ||
236 | .word 0x9B00 # code read/exec. ??? Why I need 0x9B00 (as opposed to 0x9A00 in order for this to work?) | ||
237 | .word 0x00CF # granularity = 4096, 386 | ||
238 | # (+5th nibble of limit) | ||
239 | |||
240 | .word 0xFFFF # 4Gb - (0x100000*0x1000 = 4Gb) | ||
241 | .word 0 # base address = 0 | ||
242 | .word 0x9200 # data read/write | ||
243 | .word 0x00CF # granularity = 4096, 386 | ||
244 | # (+5th nibble of limit) | ||
245 | # this is 64bit descriptor for code | ||
246 | .word 0xFFFF | ||
247 | .word 0 | ||
248 | .word 0x9A00 # code read/exec | ||
249 | .word 0x00AF # as above, but it is long mode and with D=0 | ||
250 | 218 | ||
251 | idt_48a: | 219 | idt_48a: |
252 | .word 0 # idt limit = 0 | 220 | .word 0 # idt limit = 0 |
253 | .word 0, 0 # idt base = 0L | 221 | .word 0, 0 # idt base = 0L |
254 | 222 | ||
255 | gdt_48a: | 223 | gdt_48a: |
256 | .word 0x8000 # gdt limit=2048, | 224 | .word 0x800 # gdt limit=2048, |
257 | # 256 GDT entries | 225 | # 256 GDT entries |
258 | .word 0, 0 # gdt base (filled in later) | 226 | .word 0, 0 # gdt base (filled in later) |
259 | 227 | ||
@@ -263,7 +231,7 @@ video_mode: .quad 0 | |||
263 | video_flags: .quad 0 | 231 | video_flags: .quad 0 |
264 | 232 | ||
265 | bogus_real_magic: | 233 | bogus_real_magic: |
266 | movb $0xba,%al ; outb %al,$0x80 | 234 | movb $0xba,%al ; outb %al,$0x80 |
267 | jmp bogus_real_magic | 235 | jmp bogus_real_magic |
268 | 236 | ||
269 | bogus_32_magic: | 237 | bogus_32_magic: |