aboutsummaryrefslogtreecommitdiffstats
path: root/arch/x86/kernel/process_64.c
diff options
context:
space:
mode:
authorLen Brown <len.brown@intel.com>2008-10-22 23:57:26 -0400
committerLen Brown <len.brown@intel.com>2008-10-23 00:11:07 -0400
commit057316cc6a5b521b332a1d7ccc871cd60c904c74 (patch)
tree4333e608da237c73ff69b10878025cca96dcb4c8 /arch/x86/kernel/process_64.c
parent3e2dab9a1c2deb03c311eb3f83466009147ed4d3 (diff)
parent2515ddc6db8eb49a79f0fe5e67ff09ac7c81eab4 (diff)
Merge branch 'linus' into test
Conflicts: MAINTAINERS arch/x86/kernel/acpi/boot.c arch/x86/kernel/acpi/sleep.c drivers/acpi/Kconfig drivers/pnp/Makefile drivers/pnp/quirks.c Signed-off-by: Len Brown <len.brown@intel.com>
Diffstat (limited to 'arch/x86/kernel/process_64.c')
-rw-r--r--arch/x86/kernel/process_64.c199
1 files changed, 104 insertions, 95 deletions
diff --git a/arch/x86/kernel/process_64.c b/arch/x86/kernel/process_64.c
index 3e3d503eadcf..c958120fb1b6 100644
--- a/arch/x86/kernel/process_64.c
+++ b/arch/x86/kernel/process_64.c
@@ -37,11 +37,11 @@
37#include <linux/kdebug.h> 37#include <linux/kdebug.h>
38#include <linux/tick.h> 38#include <linux/tick.h>
39#include <linux/prctl.h> 39#include <linux/prctl.h>
40#include <linux/uaccess.h>
41#include <linux/io.h>
40 42
41#include <asm/uaccess.h>
42#include <asm/pgtable.h> 43#include <asm/pgtable.h>
43#include <asm/system.h> 44#include <asm/system.h>
44#include <asm/io.h>
45#include <asm/processor.h> 45#include <asm/processor.h>
46#include <asm/i387.h> 46#include <asm/i387.h>
47#include <asm/mmu_context.h> 47#include <asm/mmu_context.h>
@@ -51,6 +51,7 @@
51#include <asm/proto.h> 51#include <asm/proto.h>
52#include <asm/ia32.h> 52#include <asm/ia32.h>
53#include <asm/idle.h> 53#include <asm/idle.h>
54#include <asm/syscalls.h>
54 55
55asmlinkage extern void ret_from_fork(void); 56asmlinkage extern void ret_from_fork(void);
56 57
@@ -92,30 +93,12 @@ void exit_idle(void)
92 __exit_idle(); 93 __exit_idle();
93} 94}
94 95
95#ifdef CONFIG_HOTPLUG_CPU 96#ifndef CONFIG_SMP
96DECLARE_PER_CPU(int, cpu_state);
97
98#include <asm/nmi.h>
99/* We halt the CPU with physical CPU hotplug */
100static inline void play_dead(void)
101{
102 idle_task_exit();
103 c1e_remove_cpu(raw_smp_processor_id());
104
105 mb();
106 /* Ack it */
107 __get_cpu_var(cpu_state) = CPU_DEAD;
108
109 local_irq_disable();
110 /* mask all interrupts, flush any and all caches, and halt */
111 wbinvd_halt();
112}
113#else
114static inline void play_dead(void) 97static inline void play_dead(void)
115{ 98{
116 BUG(); 99 BUG();
117} 100}
118#endif /* CONFIG_HOTPLUG_CPU */ 101#endif
119 102
120/* 103/*
121 * The idle thread. There's no useful work to be 104 * The idle thread. There's no useful work to be
@@ -160,7 +143,7 @@ void cpu_idle(void)
160} 143}
161 144
162/* Prints also some state that isn't saved in the pt_regs */ 145/* Prints also some state that isn't saved in the pt_regs */
163void __show_regs(struct pt_regs * regs) 146void __show_regs(struct pt_regs *regs, int all)
164{ 147{
165 unsigned long cr0 = 0L, cr2 = 0L, cr3 = 0L, cr4 = 0L, fs, gs, shadowgs; 148 unsigned long cr0 = 0L, cr2 = 0L, cr3 = 0L, cr4 = 0L, fs, gs, shadowgs;
166 unsigned long d0, d1, d2, d3, d6, d7; 149 unsigned long d0, d1, d2, d3, d6, d7;
@@ -169,60 +152,65 @@ void __show_regs(struct pt_regs * regs)
169 152
170 printk("\n"); 153 printk("\n");
171 print_modules(); 154 print_modules();
172 printk("Pid: %d, comm: %.20s %s %s %.*s\n", 155 printk(KERN_INFO "Pid: %d, comm: %.20s %s %s %.*s\n",
173 current->pid, current->comm, print_tainted(), 156 current->pid, current->comm, print_tainted(),
174 init_utsname()->release, 157 init_utsname()->release,
175 (int)strcspn(init_utsname()->version, " "), 158 (int)strcspn(init_utsname()->version, " "),
176 init_utsname()->version); 159 init_utsname()->version);
177 printk("RIP: %04lx:[<%016lx>] ", regs->cs & 0xffff, regs->ip); 160 printk(KERN_INFO "RIP: %04lx:[<%016lx>] ", regs->cs & 0xffff, regs->ip);
178 printk_address(regs->ip, 1); 161 printk_address(regs->ip, 1);
179 printk("RSP: %04lx:%016lx EFLAGS: %08lx\n", regs->ss, regs->sp, 162 printk(KERN_INFO "RSP: %04lx:%016lx EFLAGS: %08lx\n", regs->ss,
180 regs->flags); 163 regs->sp, regs->flags);
181 printk("RAX: %016lx RBX: %016lx RCX: %016lx\n", 164 printk(KERN_INFO "RAX: %016lx RBX: %016lx RCX: %016lx\n",
182 regs->ax, regs->bx, regs->cx); 165 regs->ax, regs->bx, regs->cx);
183 printk("RDX: %016lx RSI: %016lx RDI: %016lx\n", 166 printk(KERN_INFO "RDX: %016lx RSI: %016lx RDI: %016lx\n",
184 regs->dx, regs->si, regs->di); 167 regs->dx, regs->si, regs->di);
185 printk("RBP: %016lx R08: %016lx R09: %016lx\n", 168 printk(KERN_INFO "RBP: %016lx R08: %016lx R09: %016lx\n",
186 regs->bp, regs->r8, regs->r9); 169 regs->bp, regs->r8, regs->r9);
187 printk("R10: %016lx R11: %016lx R12: %016lx\n", 170 printk(KERN_INFO "R10: %016lx R11: %016lx R12: %016lx\n",
188 regs->r10, regs->r11, regs->r12); 171 regs->r10, regs->r11, regs->r12);
189 printk("R13: %016lx R14: %016lx R15: %016lx\n", 172 printk(KERN_INFO "R13: %016lx R14: %016lx R15: %016lx\n",
190 regs->r13, regs->r14, regs->r15); 173 regs->r13, regs->r14, regs->r15);
191 174
192 asm("movl %%ds,%0" : "=r" (ds)); 175 asm("movl %%ds,%0" : "=r" (ds));
193 asm("movl %%cs,%0" : "=r" (cs)); 176 asm("movl %%cs,%0" : "=r" (cs));
194 asm("movl %%es,%0" : "=r" (es)); 177 asm("movl %%es,%0" : "=r" (es));
195 asm("movl %%fs,%0" : "=r" (fsindex)); 178 asm("movl %%fs,%0" : "=r" (fsindex));
196 asm("movl %%gs,%0" : "=r" (gsindex)); 179 asm("movl %%gs,%0" : "=r" (gsindex));
197 180
198 rdmsrl(MSR_FS_BASE, fs); 181 rdmsrl(MSR_FS_BASE, fs);
199 rdmsrl(MSR_GS_BASE, gs); 182 rdmsrl(MSR_GS_BASE, gs);
200 rdmsrl(MSR_KERNEL_GS_BASE, shadowgs); 183 rdmsrl(MSR_KERNEL_GS_BASE, shadowgs);
184
185 if (!all)
186 return;
201 187
202 cr0 = read_cr0(); 188 cr0 = read_cr0();
203 cr2 = read_cr2(); 189 cr2 = read_cr2();
204 cr3 = read_cr3(); 190 cr3 = read_cr3();
205 cr4 = read_cr4(); 191 cr4 = read_cr4();
206 192
207 printk("FS: %016lx(%04x) GS:%016lx(%04x) knlGS:%016lx\n", 193 printk(KERN_INFO "FS: %016lx(%04x) GS:%016lx(%04x) knlGS:%016lx\n",
208 fs,fsindex,gs,gsindex,shadowgs); 194 fs, fsindex, gs, gsindex, shadowgs);
209 printk("CS: %04x DS: %04x ES: %04x CR0: %016lx\n", cs, ds, es, cr0); 195 printk(KERN_INFO "CS: %04x DS: %04x ES: %04x CR0: %016lx\n", cs, ds,
210 printk("CR2: %016lx CR3: %016lx CR4: %016lx\n", cr2, cr3, cr4); 196 es, cr0);
197 printk(KERN_INFO "CR2: %016lx CR3: %016lx CR4: %016lx\n", cr2, cr3,
198 cr4);
211 199
212 get_debugreg(d0, 0); 200 get_debugreg(d0, 0);
213 get_debugreg(d1, 1); 201 get_debugreg(d1, 1);
214 get_debugreg(d2, 2); 202 get_debugreg(d2, 2);
215 printk("DR0: %016lx DR1: %016lx DR2: %016lx\n", d0, d1, d2); 203 printk(KERN_INFO "DR0: %016lx DR1: %016lx DR2: %016lx\n", d0, d1, d2);
216 get_debugreg(d3, 3); 204 get_debugreg(d3, 3);
217 get_debugreg(d6, 6); 205 get_debugreg(d6, 6);
218 get_debugreg(d7, 7); 206 get_debugreg(d7, 7);
219 printk("DR3: %016lx DR6: %016lx DR7: %016lx\n", d3, d6, d7); 207 printk(KERN_INFO "DR3: %016lx DR6: %016lx DR7: %016lx\n", d3, d6, d7);
220} 208}
221 209
222void show_regs(struct pt_regs *regs) 210void show_regs(struct pt_regs *regs)
223{ 211{
224 printk("CPU %d:", smp_processor_id()); 212 printk(KERN_INFO "CPU %d:", smp_processor_id());
225 __show_regs(regs); 213 __show_regs(regs, 1);
226 show_trace(NULL, regs, (void *)(regs + 1), regs->bp); 214 show_trace(NULL, regs, (void *)(regs + 1), regs->bp);
227} 215}
228 216
@@ -247,6 +235,14 @@ void exit_thread(void)
247 t->io_bitmap_max = 0; 235 t->io_bitmap_max = 0;
248 put_cpu(); 236 put_cpu();
249 } 237 }
238#ifdef CONFIG_X86_DS
239 /* Free any DS contexts that have not been properly released. */
240 if (unlikely(t->ds_ctx)) {
241 /* we clear debugctl to make sure DS is not used. */
242 update_debugctlmsr(0);
243 ds_free(t->ds_ctx);
244 }
245#endif /* CONFIG_X86_DS */
250} 246}
251 247
252void flush_thread(void) 248void flush_thread(void)
@@ -322,10 +318,10 @@ void prepare_to_copy(struct task_struct *tsk)
322 318
323int copy_thread(int nr, unsigned long clone_flags, unsigned long sp, 319int copy_thread(int nr, unsigned long clone_flags, unsigned long sp,
324 unsigned long unused, 320 unsigned long unused,
325 struct task_struct * p, struct pt_regs * regs) 321 struct task_struct *p, struct pt_regs *regs)
326{ 322{
327 int err; 323 int err;
328 struct pt_regs * childregs; 324 struct pt_regs *childregs;
329 struct task_struct *me = current; 325 struct task_struct *me = current;
330 326
331 childregs = ((struct pt_regs *) 327 childregs = ((struct pt_regs *)
@@ -370,10 +366,10 @@ int copy_thread(int nr, unsigned long clone_flags, unsigned long sp,
370 if (test_thread_flag(TIF_IA32)) 366 if (test_thread_flag(TIF_IA32))
371 err = do_set_thread_area(p, -1, 367 err = do_set_thread_area(p, -1,
372 (struct user_desc __user *)childregs->si, 0); 368 (struct user_desc __user *)childregs->si, 0);
373 else 369 else
374#endif 370#endif
375 err = do_arch_prctl(p, ARCH_SET_FS, childregs->r8); 371 err = do_arch_prctl(p, ARCH_SET_FS, childregs->r8);
376 if (err) 372 if (err)
377 goto out; 373 goto out;
378 } 374 }
379 err = 0; 375 err = 0;
@@ -480,13 +476,27 @@ static inline void __switch_to_xtra(struct task_struct *prev_p,
480 next = &next_p->thread; 476 next = &next_p->thread;
481 477
482 debugctl = prev->debugctlmsr; 478 debugctl = prev->debugctlmsr;
483 if (next->ds_area_msr != prev->ds_area_msr) { 479
484 /* we clear debugctl to make sure DS 480#ifdef CONFIG_X86_DS
485 * is not in use when we change it */ 481 {
486 debugctl = 0; 482 unsigned long ds_prev = 0, ds_next = 0;
487 update_debugctlmsr(0); 483
488 wrmsrl(MSR_IA32_DS_AREA, next->ds_area_msr); 484 if (prev->ds_ctx)
485 ds_prev = (unsigned long)prev->ds_ctx->ds;
486 if (next->ds_ctx)
487 ds_next = (unsigned long)next->ds_ctx->ds;
488
489 if (ds_next != ds_prev) {
490 /*
491 * We clear debugctl to make sure DS
492 * is not in use when we change it:
493 */
494 debugctl = 0;
495 update_debugctlmsr(0);
496 wrmsrl(MSR_IA32_DS_AREA, ds_next);
497 }
489 } 498 }
499#endif /* CONFIG_X86_DS */
490 500
491 if (next->debugctlmsr != debugctl) 501 if (next->debugctlmsr != debugctl)
492 update_debugctlmsr(next->debugctlmsr); 502 update_debugctlmsr(next->debugctlmsr);
@@ -524,13 +534,13 @@ static inline void __switch_to_xtra(struct task_struct *prev_p,
524 memset(tss->io_bitmap, 0xff, prev->io_bitmap_max); 534 memset(tss->io_bitmap, 0xff, prev->io_bitmap_max);
525 } 535 }
526 536
527#ifdef X86_BTS 537#ifdef CONFIG_X86_PTRACE_BTS
528 if (test_tsk_thread_flag(prev_p, TIF_BTS_TRACE_TS)) 538 if (test_tsk_thread_flag(prev_p, TIF_BTS_TRACE_TS))
529 ptrace_bts_take_timestamp(prev_p, BTS_TASK_DEPARTS); 539 ptrace_bts_take_timestamp(prev_p, BTS_TASK_DEPARTS);
530 540
531 if (test_tsk_thread_flag(next_p, TIF_BTS_TRACE_TS)) 541 if (test_tsk_thread_flag(next_p, TIF_BTS_TRACE_TS))
532 ptrace_bts_take_timestamp(next_p, BTS_TASK_ARRIVES); 542 ptrace_bts_take_timestamp(next_p, BTS_TASK_ARRIVES);
533#endif 543#endif /* CONFIG_X86_PTRACE_BTS */
534} 544}
535 545
536/* 546/*
@@ -552,7 +562,7 @@ __switch_to(struct task_struct *prev_p, struct task_struct *next_p)
552 unsigned fsindex, gsindex; 562 unsigned fsindex, gsindex;
553 563
554 /* we're going to use this soon, after a few expensive things */ 564 /* we're going to use this soon, after a few expensive things */
555 if (next_p->fpu_counter>5) 565 if (next_p->fpu_counter > 5)
556 prefetch(next->xstate); 566 prefetch(next->xstate);
557 567
558 /* 568 /*
@@ -560,13 +570,13 @@ __switch_to(struct task_struct *prev_p, struct task_struct *next_p)
560 */ 570 */
561 load_sp0(tss, next); 571 load_sp0(tss, next);
562 572
563 /* 573 /*
564 * Switch DS and ES. 574 * Switch DS and ES.
565 * This won't pick up thread selector changes, but I guess that is ok. 575 * This won't pick up thread selector changes, but I guess that is ok.
566 */ 576 */
567 savesegment(es, prev->es); 577 savesegment(es, prev->es);
568 if (unlikely(next->es | prev->es)) 578 if (unlikely(next->es | prev->es))
569 loadsegment(es, next->es); 579 loadsegment(es, next->es);
570 580
571 savesegment(ds, prev->ds); 581 savesegment(ds, prev->ds);
572 if (unlikely(next->ds | prev->ds)) 582 if (unlikely(next->ds | prev->ds))
@@ -592,7 +602,7 @@ __switch_to(struct task_struct *prev_p, struct task_struct *next_p)
592 */ 602 */
593 arch_leave_lazy_cpu_mode(); 603 arch_leave_lazy_cpu_mode();
594 604
595 /* 605 /*
596 * Switch FS and GS. 606 * Switch FS and GS.
597 * 607 *
598 * Segment register != 0 always requires a reload. Also 608 * Segment register != 0 always requires a reload. Also
@@ -601,13 +611,13 @@ __switch_to(struct task_struct *prev_p, struct task_struct *next_p)
601 */ 611 */
602 if (unlikely(fsindex | next->fsindex | prev->fs)) { 612 if (unlikely(fsindex | next->fsindex | prev->fs)) {
603 loadsegment(fs, next->fsindex); 613 loadsegment(fs, next->fsindex);
604 /* 614 /*
605 * Check if the user used a selector != 0; if yes 615 * Check if the user used a selector != 0; if yes
606 * clear 64bit base, since overloaded base is always 616 * clear 64bit base, since overloaded base is always
607 * mapped to the Null selector 617 * mapped to the Null selector
608 */ 618 */
609 if (fsindex) 619 if (fsindex)
610 prev->fs = 0; 620 prev->fs = 0;
611 } 621 }
612 /* when next process has a 64bit base use it */ 622 /* when next process has a 64bit base use it */
613 if (next->fs) 623 if (next->fs)
@@ -617,7 +627,7 @@ __switch_to(struct task_struct *prev_p, struct task_struct *next_p)
617 if (unlikely(gsindex | next->gsindex | prev->gs)) { 627 if (unlikely(gsindex | next->gsindex | prev->gs)) {
618 load_gs_index(next->gsindex); 628 load_gs_index(next->gsindex);
619 if (gsindex) 629 if (gsindex)
620 prev->gs = 0; 630 prev->gs = 0;
621 } 631 }
622 if (next->gs) 632 if (next->gs)
623 wrmsrl(MSR_KERNEL_GS_BASE, next->gs); 633 wrmsrl(MSR_KERNEL_GS_BASE, next->gs);
@@ -626,12 +636,12 @@ __switch_to(struct task_struct *prev_p, struct task_struct *next_p)
626 /* Must be after DS reload */ 636 /* Must be after DS reload */
627 unlazy_fpu(prev_p); 637 unlazy_fpu(prev_p);
628 638
629 /* 639 /*
630 * Switch the PDA and FPU contexts. 640 * Switch the PDA and FPU contexts.
631 */ 641 */
632 prev->usersp = read_pda(oldrsp); 642 prev->usersp = read_pda(oldrsp);
633 write_pda(oldrsp, next->usersp); 643 write_pda(oldrsp, next->usersp);
634 write_pda(pcurrent, next_p); 644 write_pda(pcurrent, next_p);
635 645
636 write_pda(kernelstack, 646 write_pda(kernelstack,
637 (unsigned long)task_stack_page(next_p) + 647 (unsigned long)task_stack_page(next_p) +
@@ -672,7 +682,7 @@ long sys_execve(char __user *name, char __user * __user *argv,
672 char __user * __user *envp, struct pt_regs *regs) 682 char __user * __user *envp, struct pt_regs *regs)
673{ 683{
674 long error; 684 long error;
675 char * filename; 685 char *filename;
676 686
677 filename = getname(name); 687 filename = getname(name);
678 error = PTR_ERR(filename); 688 error = PTR_ERR(filename);
@@ -730,55 +740,55 @@ asmlinkage long sys_vfork(struct pt_regs *regs)
730unsigned long get_wchan(struct task_struct *p) 740unsigned long get_wchan(struct task_struct *p)
731{ 741{
732 unsigned long stack; 742 unsigned long stack;
733 u64 fp,ip; 743 u64 fp, ip;
734 int count = 0; 744 int count = 0;
735 745
736 if (!p || p == current || p->state==TASK_RUNNING) 746 if (!p || p == current || p->state == TASK_RUNNING)
737 return 0; 747 return 0;
738 stack = (unsigned long)task_stack_page(p); 748 stack = (unsigned long)task_stack_page(p);
739 if (p->thread.sp < stack || p->thread.sp > stack+THREAD_SIZE) 749 if (p->thread.sp < stack || p->thread.sp >= stack+THREAD_SIZE)
740 return 0; 750 return 0;
741 fp = *(u64 *)(p->thread.sp); 751 fp = *(u64 *)(p->thread.sp);
742 do { 752 do {
743 if (fp < (unsigned long)stack || 753 if (fp < (unsigned long)stack ||
744 fp > (unsigned long)stack+THREAD_SIZE) 754 fp >= (unsigned long)stack+THREAD_SIZE)
745 return 0; 755 return 0;
746 ip = *(u64 *)(fp+8); 756 ip = *(u64 *)(fp+8);
747 if (!in_sched_functions(ip)) 757 if (!in_sched_functions(ip))
748 return ip; 758 return ip;
749 fp = *(u64 *)fp; 759 fp = *(u64 *)fp;
750 } while (count++ < 16); 760 } while (count++ < 16);
751 return 0; 761 return 0;
752} 762}
753 763
754long do_arch_prctl(struct task_struct *task, int code, unsigned long addr) 764long do_arch_prctl(struct task_struct *task, int code, unsigned long addr)
755{ 765{
756 int ret = 0; 766 int ret = 0;
757 int doit = task == current; 767 int doit = task == current;
758 int cpu; 768 int cpu;
759 769
760 switch (code) { 770 switch (code) {
761 case ARCH_SET_GS: 771 case ARCH_SET_GS:
762 if (addr >= TASK_SIZE_OF(task)) 772 if (addr >= TASK_SIZE_OF(task))
763 return -EPERM; 773 return -EPERM;
764 cpu = get_cpu(); 774 cpu = get_cpu();
765 /* handle small bases via the GDT because that's faster to 775 /* handle small bases via the GDT because that's faster to
766 switch. */ 776 switch. */
767 if (addr <= 0xffffffff) { 777 if (addr <= 0xffffffff) {
768 set_32bit_tls(task, GS_TLS, addr); 778 set_32bit_tls(task, GS_TLS, addr);
769 if (doit) { 779 if (doit) {
770 load_TLS(&task->thread, cpu); 780 load_TLS(&task->thread, cpu);
771 load_gs_index(GS_TLS_SEL); 781 load_gs_index(GS_TLS_SEL);
772 } 782 }
773 task->thread.gsindex = GS_TLS_SEL; 783 task->thread.gsindex = GS_TLS_SEL;
774 task->thread.gs = 0; 784 task->thread.gs = 0;
775 } else { 785 } else {
776 task->thread.gsindex = 0; 786 task->thread.gsindex = 0;
777 task->thread.gs = addr; 787 task->thread.gs = addr;
778 if (doit) { 788 if (doit) {
779 load_gs_index(0); 789 load_gs_index(0);
780 ret = checking_wrmsrl(MSR_KERNEL_GS_BASE, addr); 790 ret = checking_wrmsrl(MSR_KERNEL_GS_BASE, addr);
781 } 791 }
782 } 792 }
783 put_cpu(); 793 put_cpu();
784 break; 794 break;
@@ -832,8 +842,7 @@ long do_arch_prctl(struct task_struct *task, int code, unsigned long addr)
832 rdmsrl(MSR_KERNEL_GS_BASE, base); 842 rdmsrl(MSR_KERNEL_GS_BASE, base);
833 else 843 else
834 base = task->thread.gs; 844 base = task->thread.gs;
835 } 845 } else
836 else
837 base = task->thread.gs; 846 base = task->thread.gs;
838 ret = put_user(base, (unsigned long __user *)addr); 847 ret = put_user(base, (unsigned long __user *)addr);
839 break; 848 break;