]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - arch/x86/kernel/process_64.c
Merge branch 'upstream-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/jgarzi...
[mirror_ubuntu-artful-kernel.git] / arch / x86 / kernel / process_64.c
CommitLineData
1da177e4 1/*
1da177e4
LT
2 * Copyright (C) 1995 Linus Torvalds
3 *
4 * Pentium III FXSR, SSE support
5 * Gareth Hughes <gareth@valinux.com>, May 2000
6612538c 6 *
1da177e4
LT
7 * X86-64 port
8 * Andi Kleen.
76e4f660
AR
9 *
10 * CPU hotplug support - ashok.raj@intel.com
1da177e4
LT
11 */
12
/*
 * This file handles the architecture-dependent parts of process handling.
 */
16
42059429 17#include <linux/stackprotector.h>
76e4f660 18#include <linux/cpu.h>
1da177e4
LT
19#include <linux/errno.h>
20#include <linux/sched.h>
6612538c 21#include <linux/fs.h>
1da177e4
LT
22#include <linux/kernel.h>
23#include <linux/mm.h>
24#include <linux/elfcore.h>
25#include <linux/smp.h>
26#include <linux/slab.h>
27#include <linux/user.h>
1da177e4 28#include <linux/interrupt.h>
6612538c 29#include <linux/utsname.h>
1da177e4 30#include <linux/delay.h>
6612538c 31#include <linux/module.h>
1da177e4 32#include <linux/ptrace.h>
95833c83 33#include <linux/notifier.h>
c6fd91f0 34#include <linux/kprobes.h>
1eeb66a1 35#include <linux/kdebug.h>
02290683 36#include <linux/tick.h>
529e25f6 37#include <linux/prctl.h>
7de08b4e
GP
38#include <linux/uaccess.h>
39#include <linux/io.h>
8b96f011 40#include <linux/ftrace.h>
48ec4d95 41#include <linux/dmi.h>
1da177e4 42
1da177e4
LT
43#include <asm/pgtable.h>
44#include <asm/system.h>
1da177e4
LT
45#include <asm/processor.h>
46#include <asm/i387.h>
47#include <asm/mmu_context.h>
1da177e4 48#include <asm/prctl.h>
1da177e4
LT
49#include <asm/desc.h>
50#include <asm/proto.h>
51#include <asm/ia32.h>
95833c83 52#include <asm/idle.h>
bbc1f698 53#include <asm/syscalls.h>
bf53de90 54#include <asm/ds.h>
1da177e4
LT
55
56asmlinkage extern void ret_from_fork(void);
57
3d1e42a7 58DEFINE_PER_CPU(unsigned long, old_rsp);
c2558e0e 59static DEFINE_PER_CPU(unsigned char, is_idle);
3d1e42a7 60
1da177e4
LT
61unsigned long kernel_thread_flags = CLONE_VM | CLONE_UNTRACED;
62
e041c683 63static ATOMIC_NOTIFIER_HEAD(idle_notifier);
95833c83
AK
64
65void idle_notifier_register(struct notifier_block *n)
66{
e041c683 67 atomic_notifier_chain_register(&idle_notifier, n);
95833c83 68}
c7d87d79
VP
69EXPORT_SYMBOL_GPL(idle_notifier_register);
70
71void idle_notifier_unregister(struct notifier_block *n)
72{
73 atomic_notifier_chain_unregister(&idle_notifier, n);
74}
75EXPORT_SYMBOL_GPL(idle_notifier_unregister);
95833c83 76
95833c83
AK
77void enter_idle(void)
78{
c2558e0e 79 percpu_write(is_idle, 1);
e041c683 80 atomic_notifier_call_chain(&idle_notifier, IDLE_START, NULL);
95833c83
AK
81}
82
83static void __exit_idle(void)
84{
c2558e0e 85 if (x86_test_and_clear_bit_percpu(0, is_idle) == 0)
a15da49d 86 return;
e041c683 87 atomic_notifier_call_chain(&idle_notifier, IDLE_END, NULL);
95833c83
AK
88}
89
90/* Called from interrupts to signify idle end */
91void exit_idle(void)
92{
a15da49d
AK
93 /* idle loop has pid 0 */
94 if (current->pid)
95833c83
AK
95 return;
96 __exit_idle();
97}
98
#ifndef CONFIG_SMP
/*
 * Non-SMP stub: cpu_idle() only calls this when the current CPU is
 * reported offline, which is treated as a bug in this configuration.
 */
static inline void play_dead(void)
{
	BUG();
}
#endif
76e4f660 105
1da177e4
LT
106/*
107 * The idle thread. There's no useful work to be
108 * done, so just try to conserve power and have a
109 * low exit latency (ie sit in a loop waiting for
110 * somebody to say that they'd like to reschedule)
111 */
b10db7f0 112void cpu_idle(void)
1da177e4 113{
495ab9c0 114 current_thread_info()->status |= TS_POLLING;
ce22bd92 115
ce22bd92 116 /*
5c79d2a5
TH
117 * If we're the non-boot CPU, nothing set the stack canary up
118 * for us. CPU0 already has it initialized but no harm in
119 * doing it again. This is a good place for updating it, as
120 * we wont ever return from this function (so the invalid
121 * canaries already on the stack wont ever trigger).
ce22bd92 122 */
18aa8bb1
IM
123 boot_init_stack_canary();
124
1da177e4
LT
125 /* endless idle loop with no priority at all */
126 while (1) {
b8f8c3cf 127 tick_nohz_stop_sched_tick(1);
1da177e4 128 while (!need_resched()) {
1da177e4 129
1da177e4 130 rmb();
6ddd2a27 131
76e4f660
AR
132 if (cpu_is_offline(smp_processor_id()))
133 play_dead();
d331e739
VP
134 /*
135 * Idle routines should keep interrupts disabled
136 * from here on, until they go to idle.
137 * Otherwise, idle callbacks can misfire.
138 */
139 local_irq_disable();
95833c83 140 enter_idle();
81d68a96
SR
141 /* Don't trace irqs off for idle */
142 stop_critical_timings();
6ddd2a27 143 pm_idle();
81d68a96 144 start_critical_timings();
a15da49d
AK
145 /* In many cases the interrupt that ended idle
146 has already called exit_idle. But some idle
147 loops can be woken up without interrupt. */
95833c83 148 __exit_idle();
1da177e4
LT
149 }
150
02290683 151 tick_nohz_restart_sched_tick();
5bfb5d69 152 preempt_enable_no_resched();
1da177e4 153 schedule();
5bfb5d69 154 preempt_disable();
1da177e4
LT
155 }
156}
157
6612538c 158/* Prints also some state that isn't saved in the pt_regs */
e2ce07c8 159void __show_regs(struct pt_regs *regs, int all)
1da177e4
LT
160{
161 unsigned long cr0 = 0L, cr2 = 0L, cr3 = 0L, cr4 = 0L, fs, gs, shadowgs;
bb1995d5 162 unsigned long d0, d1, d2, d3, d6, d7;
6612538c
HS
163 unsigned int fsindex, gsindex;
164 unsigned int ds, cs, es;
48ec4d95 165 const char *board;
1da177e4
LT
166
167 printk("\n");
168 print_modules();
48ec4d95
KM
169 board = dmi_get_system_info(DMI_PRODUCT_NAME);
170 if (!board)
171 board = "";
172 printk(KERN_INFO "Pid: %d, comm: %.20s %s %s %.*s %s\n",
9acf23c4 173 current->pid, current->comm, print_tainted(),
96b644bd
SH
174 init_utsname()->release,
175 (int)strcspn(init_utsname()->version, " "),
48ec4d95 176 init_utsname()->version, board);
8092c654 177 printk(KERN_INFO "RIP: %04lx:[<%016lx>] ", regs->cs & 0xffff, regs->ip);
aafbd7eb 178 printk_address(regs->ip, 1);
8092c654
GP
179 printk(KERN_INFO "RSP: %04lx:%016lx EFLAGS: %08lx\n", regs->ss,
180 regs->sp, regs->flags);
181 printk(KERN_INFO "RAX: %016lx RBX: %016lx RCX: %016lx\n",
65ea5b03 182 regs->ax, regs->bx, regs->cx);
8092c654 183 printk(KERN_INFO "RDX: %016lx RSI: %016lx RDI: %016lx\n",
65ea5b03 184 regs->dx, regs->si, regs->di);
8092c654 185 printk(KERN_INFO "RBP: %016lx R08: %016lx R09: %016lx\n",
65ea5b03 186 regs->bp, regs->r8, regs->r9);
8092c654 187 printk(KERN_INFO "R10: %016lx R11: %016lx R12: %016lx\n",
7de08b4e 188 regs->r10, regs->r11, regs->r12);
8092c654 189 printk(KERN_INFO "R13: %016lx R14: %016lx R15: %016lx\n",
7de08b4e 190 regs->r13, regs->r14, regs->r15);
1da177e4 191
7de08b4e
GP
192 asm("movl %%ds,%0" : "=r" (ds));
193 asm("movl %%cs,%0" : "=r" (cs));
194 asm("movl %%es,%0" : "=r" (es));
1da177e4
LT
195 asm("movl %%fs,%0" : "=r" (fsindex));
196 asm("movl %%gs,%0" : "=r" (gsindex));
197
198 rdmsrl(MSR_FS_BASE, fs);
7de08b4e
GP
199 rdmsrl(MSR_GS_BASE, gs);
200 rdmsrl(MSR_KERNEL_GS_BASE, shadowgs);
1da177e4 201
e2ce07c8
PE
202 if (!all)
203 return;
1da177e4 204
f51c9452
GOC
205 cr0 = read_cr0();
206 cr2 = read_cr2();
207 cr3 = read_cr3();
208 cr4 = read_cr4();
1da177e4 209
8092c654 210 printk(KERN_INFO "FS: %016lx(%04x) GS:%016lx(%04x) knlGS:%016lx\n",
7de08b4e 211 fs, fsindex, gs, gsindex, shadowgs);
8092c654
GP
212 printk(KERN_INFO "CS: %04x DS: %04x ES: %04x CR0: %016lx\n", cs, ds,
213 es, cr0);
214 printk(KERN_INFO "CR2: %016lx CR3: %016lx CR4: %016lx\n", cr2, cr3,
215 cr4);
bb1995d5
AS
216
217 get_debugreg(d0, 0);
218 get_debugreg(d1, 1);
219 get_debugreg(d2, 2);
8092c654 220 printk(KERN_INFO "DR0: %016lx DR1: %016lx DR2: %016lx\n", d0, d1, d2);
bb1995d5
AS
221 get_debugreg(d3, 3);
222 get_debugreg(d6, 6);
223 get_debugreg(d7, 7);
8092c654 224 printk(KERN_INFO "DR3: %016lx DR6: %016lx DR7: %016lx\n", d3, d6, d7);
1da177e4
LT
225}
226
227void show_regs(struct pt_regs *regs)
228{
8092c654 229 printk(KERN_INFO "CPU %d:", smp_processor_id());
e2ce07c8 230 __show_regs(regs, 1);
bc850d6b 231 show_trace(NULL, regs, (void *)(regs + 1), regs->bp);
1da177e4
LT
232}
233
1da177e4
LT
234void release_thread(struct task_struct *dead_task)
235{
236 if (dead_task->mm) {
237 if (dead_task->mm->context.size) {
238 printk("WARNING: dead process %8s still has LDT? <%p/%d>\n",
239 dead_task->comm,
240 dead_task->mm->context.ldt,
241 dead_task->mm->context.size);
242 BUG();
243 }
244 }
245}
246
247static inline void set_32bit_tls(struct task_struct *t, int tls, u32 addr)
248{
6612538c 249 struct user_desc ud = {
1da177e4
LT
250 .base_addr = addr,
251 .limit = 0xfffff,
252 .seg_32bit = 1,
253 .limit_in_pages = 1,
254 .useable = 1,
255 };
ade1af77 256 struct desc_struct *desc = t->thread.tls_array;
1da177e4 257 desc += tls;
80fbb69a 258 fill_ldt(desc, &ud);
1da177e4
LT
259}
260
261static inline u32 read_32bit_tls(struct task_struct *t, int tls)
262{
91394eb0 263 return get_desc_base(&t->thread.tls_array[tls]);
1da177e4
LT
264}
265
/*
 * Called before a new thread is allocated and the current task is
 * copied into it; runs unlazy_fpu() on @tsk first.
 */
void prepare_to_copy(struct task_struct *tsk)
{
	unlazy_fpu(tsk);
}
274
6f2c55b8 275int copy_thread(unsigned long clone_flags, unsigned long sp,
1da177e4 276 unsigned long unused,
7de08b4e 277 struct task_struct *p, struct pt_regs *regs)
1da177e4
LT
278{
279 int err;
7de08b4e 280 struct pt_regs *childregs;
1da177e4
LT
281 struct task_struct *me = current;
282
a88cde13 283 childregs = ((struct pt_regs *)
57eafdc2 284 (THREAD_SIZE + task_stack_page(p))) - 1;
1da177e4
LT
285 *childregs = *regs;
286
65ea5b03
PA
287 childregs->ax = 0;
288 childregs->sp = sp;
289 if (sp == ~0UL)
290 childregs->sp = (unsigned long)childregs;
1da177e4 291
faca6227
PA
292 p->thread.sp = (unsigned long) childregs;
293 p->thread.sp0 = (unsigned long) (childregs+1);
294 p->thread.usersp = me->thread.usersp;
1da177e4 295
e4f17c43 296 set_tsk_thread_flag(p, TIF_FORK);
1da177e4
LT
297
298 p->thread.fs = me->thread.fs;
299 p->thread.gs = me->thread.gs;
300
ada85708
JF
301 savesegment(gs, p->thread.gsindex);
302 savesegment(fs, p->thread.fsindex);
303 savesegment(es, p->thread.es);
304 savesegment(ds, p->thread.ds);
1da177e4 305
d3a4f48d 306 if (unlikely(test_tsk_thread_flag(me, TIF_IO_BITMAP))) {
1da177e4
LT
307 p->thread.io_bitmap_ptr = kmalloc(IO_BITMAP_BYTES, GFP_KERNEL);
308 if (!p->thread.io_bitmap_ptr) {
309 p->thread.io_bitmap_max = 0;
310 return -ENOMEM;
311 }
a88cde13
AK
312 memcpy(p->thread.io_bitmap_ptr, me->thread.io_bitmap_ptr,
313 IO_BITMAP_BYTES);
d3a4f48d 314 set_tsk_thread_flag(p, TIF_IO_BITMAP);
6612538c 315 }
1da177e4
LT
316
317 /*
318 * Set a new TLS for the child thread?
319 */
320 if (clone_flags & CLONE_SETTLS) {
321#ifdef CONFIG_IA32_EMULATION
322 if (test_thread_flag(TIF_IA32))
efd1ca52 323 err = do_set_thread_area(p, -1,
65ea5b03 324 (struct user_desc __user *)childregs->si, 0);
7de08b4e
GP
325 else
326#endif
327 err = do_arch_prctl(p, ARCH_SET_FS, childregs->r8);
328 if (err)
1da177e4
LT
329 goto out;
330 }
bf53de90 331
2311f0de
MM
332 clear_tsk_thread_flag(p, TIF_DS_AREA_MSR);
333 p->thread.ds_ctx = NULL;
bf53de90
MM
334
335 clear_tsk_thread_flag(p, TIF_DEBUGCTLMSR);
336 p->thread.debugctlmsr = 0;
337
1da177e4
LT
338 err = 0;
339out:
340 if (err && p->thread.io_bitmap_ptr) {
341 kfree(p->thread.io_bitmap_ptr);
342 p->thread.io_bitmap_max = 0;
343 }
344 return err;
345}
346
513ad84b
IM
347void
348start_thread(struct pt_regs *regs, unsigned long new_ip, unsigned long new_sp)
349{
ada85708
JF
350 loadsegment(fs, 0);
351 loadsegment(es, 0);
352 loadsegment(ds, 0);
513ad84b
IM
353 load_gs_index(0);
354 regs->ip = new_ip;
355 regs->sp = new_sp;
3d1e42a7 356 percpu_write(old_rsp, new_sp);
513ad84b
IM
357 regs->cs = __USER_CS;
358 regs->ss = __USER_DS;
359 regs->flags = 0x200;
360 set_fs(USER_DS);
aa283f49
SS
361 /*
362 * Free the old FP and other extended state
363 */
364 free_thread_xstate(current);
513ad84b
IM
365}
366EXPORT_SYMBOL_GPL(start_thread);
367
1da177e4
LT
368/*
369 * switch_to(x,y) should switch tasks from x to y.
370 *
6612538c 371 * This could still be optimized:
1da177e4
LT
372 * - fold all the options into a flag word and test it with a single test.
373 * - could test fs/gs bitsliced
099f318b
AK
374 *
375 * Kprobes not supported here. Set the probe on schedule instead.
8b96f011 376 * Function graph tracer not supported too.
1da177e4 377 */
8b96f011 378__notrace_funcgraph struct task_struct *
a88cde13 379__switch_to(struct task_struct *prev_p, struct task_struct *next_p)
1da177e4 380{
87b935a0
JF
381 struct thread_struct *prev = &prev_p->thread;
382 struct thread_struct *next = &next_p->thread;
6612538c 383 int cpu = smp_processor_id();
1da177e4 384 struct tss_struct *tss = &per_cpu(init_tss, cpu);
478de5a9 385 unsigned fsindex, gsindex;
17950c5b
JF
386 bool preload_fpu;
387
388 /*
389 * If the task has used fpu the last 5 timeslices, just do a full
390 * restore of the math state immediately to avoid the trap; the
391 * chances of needing FPU soon are obviously high now
392 */
393 preload_fpu = tsk_used_math(next_p) && next_p->fpu_counter > 5;
1da177e4 394
e07e23e1 395 /* we're going to use this soon, after a few expensive things */
17950c5b 396 if (preload_fpu)
61c4628b 397 prefetch(next->xstate);
e07e23e1 398
1da177e4
LT
399 /*
400 * Reload esp0, LDT and the page table pointer:
401 */
7818a1e0 402 load_sp0(tss, next);
1da177e4 403
7de08b4e 404 /*
1da177e4
LT
405 * Switch DS and ES.
406 * This won't pick up thread selector changes, but I guess that is ok.
407 */
ada85708 408 savesegment(es, prev->es);
1da177e4 409 if (unlikely(next->es | prev->es))
7de08b4e 410 loadsegment(es, next->es);
ada85708
JF
411
412 savesegment(ds, prev->ds);
1da177e4
LT
413 if (unlikely(next->ds | prev->ds))
414 loadsegment(ds, next->ds);
415
478de5a9
JF
416
417 /* We must save %fs and %gs before load_TLS() because
418 * %fs and %gs may be cleared by load_TLS().
419 *
420 * (e.g. xen_load_tls())
421 */
422 savesegment(fs, fsindex);
423 savesegment(gs, gsindex);
424
1da177e4
LT
425 load_TLS(next, cpu);
426
16d9dbf0
JF
427 /* Must be after DS reload */
428 unlazy_fpu(prev_p);
429
17950c5b
JF
430 /* Make sure cpu is ready for new context */
431 if (preload_fpu)
432 clts();
433
3fe0a63e
JF
434 /*
435 * Leave lazy mode, flushing any hypercalls made here.
436 * This must be done before restoring TLS segments so
437 * the GDT and LDT are properly updated, and must be
438 * done before math_state_restore, so the TS bit is up
439 * to date.
440 */
224101ed 441 arch_end_context_switch(next_p);
3fe0a63e 442
7de08b4e 443 /*
1da177e4 444 * Switch FS and GS.
87b935a0
JF
445 *
446 * Segment register != 0 always requires a reload. Also
447 * reload when it has changed. When prev process used 64bit
448 * base always reload to avoid an information leak.
1da177e4 449 */
87b935a0
JF
450 if (unlikely(fsindex | next->fsindex | prev->fs)) {
451 loadsegment(fs, next->fsindex);
7de08b4e 452 /*
87b935a0
JF
453 * Check if the user used a selector != 0; if yes
454 * clear 64bit base, since overloaded base is always
455 * mapped to the Null selector
456 */
457 if (fsindex)
7de08b4e 458 prev->fs = 0;
1da177e4 459 }
87b935a0
JF
460 /* when next process has a 64bit base use it */
461 if (next->fs)
462 wrmsrl(MSR_FS_BASE, next->fs);
463 prev->fsindex = fsindex;
464
465 if (unlikely(gsindex | next->gsindex | prev->gs)) {
466 load_gs_index(next->gsindex);
467 if (gsindex)
7de08b4e 468 prev->gs = 0;
1da177e4 469 }
87b935a0
JF
470 if (next->gs)
471 wrmsrl(MSR_KERNEL_GS_BASE, next->gs);
472 prev->gsindex = gsindex;
1da177e4 473
7de08b4e 474 /*
45948d77 475 * Switch the PDA and FPU contexts.
1da177e4 476 */
3d1e42a7
BG
477 prev->usersp = percpu_read(old_rsp);
478 percpu_write(old_rsp, next->usersp);
c6f5e0ac 479 percpu_write(current_task, next_p);
18bd057b 480
9af45651 481 percpu_write(kernel_stack,
87b935a0 482 (unsigned long)task_stack_page(next_p) +
9af45651 483 THREAD_SIZE - KERNEL_STACK_OFFSET);
1da177e4
LT
484
485 /*
d3a4f48d 486 * Now maybe reload the debug registers and handle I/O bitmaps
1da177e4 487 */
eee3af4a
MM
488 if (unlikely(task_thread_info(next_p)->flags & _TIF_WORK_CTXSW_NEXT ||
489 task_thread_info(prev_p)->flags & _TIF_WORK_CTXSW_PREV))
d3a4f48d 490 __switch_to_xtra(prev_p, next_p, tss);
1da177e4 491
17950c5b
JF
492 /*
493 * Preload the FPU context, now that we've determined that the
494 * task is likely to be using it.
e07e23e1 495 */
17950c5b
JF
496 if (preload_fpu)
497 __math_state_restore();
1da177e4
LT
498 return prev_p;
499}
500
501/*
502 * sys_execve() executes a new program.
503 */
6612538c 504asmlinkage
1da177e4 505long sys_execve(char __user *name, char __user * __user *argv,
5d119b2c 506 char __user * __user *envp, struct pt_regs *regs)
1da177e4
LT
507{
508 long error;
7de08b4e 509 char *filename;
1da177e4
LT
510
511 filename = getname(name);
512 error = PTR_ERR(filename);
5d119b2c 513 if (IS_ERR(filename))
1da177e4 514 return error;
5d119b2c 515 error = do_execve(filename, argv, envp, regs);
1da177e4
LT
516 putname(filename);
517 return error;
518}
519
520void set_personality_64bit(void)
521{
522 /* inherit personality from parent */
523
524 /* Make sure to be in 64bit mode */
6612538c 525 clear_thread_flag(TIF_IA32);
1da177e4
LT
526
527 /* TBD: overwrites user setup. Should have two bits.
528 But 64bit processes have always behaved this way,
529 so it's not too bad. The main problem is just that
6612538c 530 32bit childs are affected again. */
1da177e4
LT
531 current->personality &= ~READ_IMPLIES_EXEC;
532}
533
a88cde13
AK
534asmlinkage long
535sys_clone(unsigned long clone_flags, unsigned long newsp,
536 void __user *parent_tid, void __user *child_tid, struct pt_regs *regs)
1da177e4
LT
537{
538 if (!newsp)
65ea5b03 539 newsp = regs->sp;
1da177e4
LT
540 return do_fork(clone_flags, newsp, regs, 0, parent_tid, child_tid);
541}
542
1da177e4
LT
543unsigned long get_wchan(struct task_struct *p)
544{
545 unsigned long stack;
7de08b4e 546 u64 fp, ip;
1da177e4
LT
547 int count = 0;
548
7de08b4e
GP
549 if (!p || p == current || p->state == TASK_RUNNING)
550 return 0;
57eafdc2 551 stack = (unsigned long)task_stack_page(p);
e1e23bb0 552 if (p->thread.sp < stack || p->thread.sp >= stack+THREAD_SIZE)
1da177e4 553 return 0;
faca6227 554 fp = *(u64 *)(p->thread.sp);
7de08b4e 555 do {
a88cde13 556 if (fp < (unsigned long)stack ||
e1e23bb0 557 fp >= (unsigned long)stack+THREAD_SIZE)
7de08b4e 558 return 0;
65ea5b03
PA
559 ip = *(u64 *)(fp+8);
560 if (!in_sched_functions(ip))
561 return ip;
7de08b4e
GP
562 fp = *(u64 *)fp;
563 } while (count++ < 16);
1da177e4
LT
564 return 0;
565}
566
567long do_arch_prctl(struct task_struct *task, int code, unsigned long addr)
7de08b4e
GP
568{
569 int ret = 0;
1da177e4
LT
570 int doit = task == current;
571 int cpu;
572
7de08b4e 573 switch (code) {
1da177e4 574 case ARCH_SET_GS:
84929801 575 if (addr >= TASK_SIZE_OF(task))
7de08b4e 576 return -EPERM;
1da177e4 577 cpu = get_cpu();
7de08b4e 578 /* handle small bases via the GDT because that's faster to
1da177e4 579 switch. */
7de08b4e
GP
580 if (addr <= 0xffffffff) {
581 set_32bit_tls(task, GS_TLS, addr);
582 if (doit) {
1da177e4 583 load_TLS(&task->thread, cpu);
7de08b4e 584 load_gs_index(GS_TLS_SEL);
1da177e4 585 }
7de08b4e 586 task->thread.gsindex = GS_TLS_SEL;
1da177e4 587 task->thread.gs = 0;
7de08b4e 588 } else {
1da177e4
LT
589 task->thread.gsindex = 0;
590 task->thread.gs = addr;
591 if (doit) {
a88cde13
AK
592 load_gs_index(0);
593 ret = checking_wrmsrl(MSR_KERNEL_GS_BASE, addr);
7de08b4e 594 }
1da177e4
LT
595 }
596 put_cpu();
597 break;
598 case ARCH_SET_FS:
599 /* Not strictly needed for fs, but do it for symmetry
600 with gs */
84929801 601 if (addr >= TASK_SIZE_OF(task))
6612538c 602 return -EPERM;
1da177e4 603 cpu = get_cpu();
6612538c 604 /* handle small bases via the GDT because that's faster to
1da177e4 605 switch. */
6612538c 606 if (addr <= 0xffffffff) {
1da177e4 607 set_32bit_tls(task, FS_TLS, addr);
6612538c
HS
608 if (doit) {
609 load_TLS(&task->thread, cpu);
ada85708 610 loadsegment(fs, FS_TLS_SEL);
1da177e4
LT
611 }
612 task->thread.fsindex = FS_TLS_SEL;
613 task->thread.fs = 0;
6612538c 614 } else {
1da177e4
LT
615 task->thread.fsindex = 0;
616 task->thread.fs = addr;
617 if (doit) {
618 /* set the selector to 0 to not confuse
619 __switch_to */
ada85708 620 loadsegment(fs, 0);
a88cde13 621 ret = checking_wrmsrl(MSR_FS_BASE, addr);
1da177e4
LT
622 }
623 }
624 put_cpu();
625 break;
6612538c
HS
626 case ARCH_GET_FS: {
627 unsigned long base;
1da177e4
LT
628 if (task->thread.fsindex == FS_TLS_SEL)
629 base = read_32bit_tls(task, FS_TLS);
a88cde13 630 else if (doit)
1da177e4 631 rdmsrl(MSR_FS_BASE, base);
a88cde13 632 else
1da177e4 633 base = task->thread.fs;
6612538c
HS
634 ret = put_user(base, (unsigned long __user *)addr);
635 break;
1da177e4 636 }
6612538c 637 case ARCH_GET_GS: {
1da177e4 638 unsigned long base;
97c2803c 639 unsigned gsindex;
1da177e4
LT
640 if (task->thread.gsindex == GS_TLS_SEL)
641 base = read_32bit_tls(task, GS_TLS);
97c2803c 642 else if (doit) {
ada85708 643 savesegment(gs, gsindex);
97c2803c
JB
644 if (gsindex)
645 rdmsrl(MSR_KERNEL_GS_BASE, base);
646 else
647 base = task->thread.gs;
7de08b4e 648 } else
1da177e4 649 base = task->thread.gs;
6612538c 650 ret = put_user(base, (unsigned long __user *)addr);
1da177e4
LT
651 break;
652 }
653
654 default:
655 ret = -EINVAL;
656 break;
6612538c 657 }
1da177e4 658
6612538c
HS
659 return ret;
660}
1da177e4
LT
661
662long sys_arch_prctl(int code, unsigned long addr)
663{
664 return do_arch_prctl(current, code, addr);
1da177e4
LT
665}
666