]> git.proxmox.com Git - mirror_ubuntu-zesty-kernel.git/blob - include/linux/tracehook.h
ptrace: move SIGTRAP on exec(2) logic to ptrace_event()
[mirror_ubuntu-zesty-kernel.git] / include / linux / tracehook.h
1 /*
2 * Tracing hooks
3 *
4 * Copyright (C) 2008-2009 Red Hat, Inc. All rights reserved.
5 *
6 * This copyrighted material is made available to anyone wishing to use,
7 * modify, copy, or redistribute it subject to the terms and conditions
8 * of the GNU General Public License v.2.
9 *
10 * This file defines hook entry points called by core code where
11 * user tracing/debugging support might need to do something. These
12 * entry points are called tracehook_*(). Each hook declared below
13 * has a detailed kerneldoc comment giving the context (locking et
14 * al) from which it is called, and the meaning of its return value.
15 *
16 * Each function here typically has only one call site, so it is ok
17 * to have some nontrivial tracehook_*() inlines. In all cases, the
18 * fast path when no tracing is enabled should be very short.
19 *
20 * The purpose of this file and the tracehook_* layer is to consolidate
21 * the interface that the kernel core and arch code uses to enable any
22 * user debugging or tracing facility (such as ptrace). The interfaces
23 * here are carefully documented so that maintainers of core and arch
24 * code do not need to think about the implementation details of the
25 * tracing facilities. Likewise, maintainers of the tracing code do not
26 * need to understand all the calling core or arch code in detail, just
27 * documented circumstances of each call, such as locking conditions.
28 *
29 * If the calling core code changes so that locking is different, then
30 * it is ok to change the interface documented here. The maintainer of
31 * core code changing should notify the maintainers of the tracing code
32 * that they need to work out the change.
33 *
34 * Some tracehook_*() inlines take arguments that the current tracing
35 * implementations might not necessarily use. These function signatures
36 * are chosen to pass in all the information that is on hand in the
37 * caller and might conceivably be relevant to a tracer, so that the
38 * core code won't have to be updated when tracing adds more features.
39 * If a call site changes so that some of those parameters are no longer
40 * already on hand without extra work, then the tracehook_* interface
41 * can change so there is no make-work burden on the core code. The
42 * maintainer of core code changing should notify the maintainers of the
43 * tracing code that they need to work out the change.
44 */
45
46 #ifndef _LINUX_TRACEHOOK_H
47 #define _LINUX_TRACEHOOK_H 1
48
49 #include <linux/sched.h>
50 #include <linux/ptrace.h>
51 #include <linux/security.h>
52 struct linux_binprm;
53
54 /**
55 * tracehook_expect_breakpoints - guess if task memory might be touched
56 * @task: current task, making a new mapping
57 *
58 * Return nonzero if @task is expected to want breakpoint insertion in
59 * its memory at some point. A zero return is no guarantee it won't
60 * be done, but this is a hint that it's known to be likely.
61 *
62 * May be called with @task->mm->mmap_sem held for writing.
63 */
64 static inline int tracehook_expect_breakpoints(struct task_struct *task)
65 {
66 return (task->ptrace & PT_PTRACED) != 0;
67 }
68
69 /*
70 * ptrace report for syscall entry and exit looks identical.
71 */
72 static inline void ptrace_report_syscall(struct pt_regs *regs)
73 {
74 int ptrace = current->ptrace;
75
76 if (!(ptrace & PT_PTRACED))
77 return;
78
79 ptrace_notify(SIGTRAP | ((ptrace & PT_TRACESYSGOOD) ? 0x80 : 0));
80
81 /*
82 * this isn't the same as continuing with a signal, but it will do
83 * for normal use. strace only continues with a signal if the
84 * stopping signal is not SIGTRAP. -brl
85 */
86 if (current->exit_code) {
87 send_sig(current->exit_code, current, 1);
88 current->exit_code = 0;
89 }
90 }
91
92 /**
93 * tracehook_report_syscall_entry - task is about to attempt a system call
94 * @regs: user register state of current task
95 *
96 * This will be called if %TIF_SYSCALL_TRACE has been set, when the
97 * current task has just entered the kernel for a system call.
98 * Full user register state is available here. Changing the values
99 * in @regs can affect the system call number and arguments to be tried.
100 * It is safe to block here, preventing the system call from beginning.
101 *
102 * Returns zero normally, or nonzero if the calling arch code should abort
103 * the system call. That must prevent normal entry so no system call is
104 * made. If @task ever returns to user mode after this, its register state
105 * is unspecified, but should be something harmless like an %ENOSYS error
106 * return. It should preserve enough information so that syscall_rollback()
107 * can work (see asm-generic/syscall.h).
108 *
109 * Called without locks, just after entering kernel mode.
110 */
111 static inline __must_check int tracehook_report_syscall_entry(
112 struct pt_regs *regs)
113 {
114 ptrace_report_syscall(regs);
115 return 0;
116 }
117
118 /**
119 * tracehook_report_syscall_exit - task has just finished a system call
120 * @regs: user register state of current task
121 * @step: nonzero if simulating single-step or block-step
122 *
123 * This will be called if %TIF_SYSCALL_TRACE has been set, when the
124 * current task has just finished an attempted system call. Full
125 * user register state is available here. It is safe to block here,
126 * preventing signals from being processed.
127 *
128 * If @step is nonzero, this report is also in lieu of the normal
129 * trap that would follow the system call instruction because
130 * user_enable_block_step() or user_enable_single_step() was used.
131 * In this case, %TIF_SYSCALL_TRACE might not be set.
132 *
133 * Called without locks, just before checking for pending signals.
134 */
135 static inline void tracehook_report_syscall_exit(struct pt_regs *regs, int step)
136 {
137 if (step) {
138 siginfo_t info;
139 user_single_step_siginfo(current, regs, &info);
140 force_sig_info(SIGTRAP, &info, current);
141 return;
142 }
143
144 ptrace_report_syscall(regs);
145 }
146
147 /**
148 * tracehook_unsafe_exec - check for exec declared unsafe due to tracing
149 * @task: current task doing exec
150 *
151 * Return %LSM_UNSAFE_* bits applied to an exec because of tracing.
152 *
153 * @task->signal->cred_guard_mutex is held by the caller through the do_execve().
154 */
155 static inline int tracehook_unsafe_exec(struct task_struct *task)
156 {
157 int unsafe = 0;
158 int ptrace = task->ptrace;
159 if (ptrace & PT_PTRACED) {
160 if (ptrace & PT_PTRACE_CAP)
161 unsafe |= LSM_UNSAFE_PTRACE_CAP;
162 else
163 unsafe |= LSM_UNSAFE_PTRACE;
164 }
165 return unsafe;
166 }
167
168 /**
169 * tracehook_tracer_task - return the task that is tracing the given task
170 * @tsk: task to consider
171 *
172 * Returns NULL if no one is tracing @task, or the &struct task_struct
173 * pointer to its tracer.
174 *
175 * Must called under rcu_read_lock(). The pointer returned might be kept
176 * live only by RCU. During exec, this may be called with task_lock()
177 * held on @task, still held from when tracehook_unsafe_exec() was called.
178 */
179 static inline struct task_struct *tracehook_tracer_task(struct task_struct *tsk)
180 {
181 if (tsk->ptrace & PT_PTRACED)
182 return rcu_dereference(tsk->parent);
183 return NULL;
184 }
185
186 /**
187 * tracehook_report_exec - a successful exec was completed
188 * @fmt: &struct linux_binfmt that performed the exec
189 * @bprm: &struct linux_binprm containing exec details
190 * @regs: user-mode register state
191 *
192 * An exec just completed, we are shortly going to return to user mode.
193 * The freshly initialized register state can be seen and changed in @regs.
194 * The name, file and other pointers in @bprm are still on hand to be
195 * inspected, but will be freed as soon as this returns.
196 *
197 * Called with no locks, but with some kernel resources held live
198 * and a reference on @fmt->module.
199 */
200 static inline void tracehook_report_exec(struct linux_binfmt *fmt,
201 struct linux_binprm *bprm,
202 struct pt_regs *regs)
203 {
204 ptrace_event(PTRACE_EVENT_EXEC, 0);
205 }
206
207 /**
208 * tracehook_report_exit - task has begun to exit
209 * @exit_code: pointer to value destined for @current->exit_code
210 *
211 * @exit_code points to the value passed to do_exit(), which tracing
212 * might change here. This is almost the first thing in do_exit(),
213 * before freeing any resources or setting the %PF_EXITING flag.
214 *
215 * Called with no locks held.
216 */
217 static inline void tracehook_report_exit(long *exit_code)
218 {
219 ptrace_event(PTRACE_EVENT_EXIT, *exit_code);
220 }
221
222 /**
223 * tracehook_prepare_clone - prepare for new child to be cloned
224 * @clone_flags: %CLONE_* flags from clone/fork/vfork system call
225 *
226 * This is called before a new user task is to be cloned.
227 * Its return value will be passed to tracehook_finish_clone().
228 *
229 * Called with no locks held.
230 */
231 static inline int tracehook_prepare_clone(unsigned clone_flags)
232 {
233 int event = 0;
234
235 if (clone_flags & CLONE_UNTRACED)
236 return 0;
237
238 if (clone_flags & CLONE_VFORK)
239 event = PTRACE_EVENT_VFORK;
240 else if ((clone_flags & CSIGNAL) != SIGCHLD)
241 event = PTRACE_EVENT_CLONE;
242 else
243 event = PTRACE_EVENT_FORK;
244
245 return ptrace_event_enabled(current, event) ? event : 0;
246 }
247
248 /**
249 * tracehook_finish_clone - new child created and being attached
250 * @child: new child task
251 * @clone_flags: %CLONE_* flags from clone/fork/vfork system call
252 * @trace: return value from tracehook_prepare_clone()
253 *
254 * This is called immediately after adding @child to its parent's children list.
255 * The @trace value is that returned by tracehook_prepare_clone().
256 *
257 * Called with current's siglock and write_lock_irq(&tasklist_lock) held.
258 */
259 static inline void tracehook_finish_clone(struct task_struct *child,
260 unsigned long clone_flags, int trace)
261 {
262 ptrace_init_task(child, (clone_flags & CLONE_PTRACE) || trace);
263 }
264
265 /**
266 * tracehook_report_clone - in parent, new child is about to start running
267 * @regs: parent's user register state
268 * @clone_flags: flags from parent's system call
269 * @pid: new child's PID in the parent's namespace
270 * @child: new child task
271 *
272 * Called after a child is set up, but before it has been started running.
273 * This is not a good place to block, because the child has not started
274 * yet. Suspend the child here if desired, and then block in
275 * tracehook_report_clone_complete(). This must prevent the child from
276 * self-reaping if tracehook_report_clone_complete() uses the @child
277 * pointer; otherwise it might have died and been released by the time
278 * tracehook_report_clone_complete() is called.
279 *
280 * Called with no locks held, but the child cannot run until this returns.
281 */
282 static inline void tracehook_report_clone(struct pt_regs *regs,
283 unsigned long clone_flags,
284 pid_t pid, struct task_struct *child)
285 {
286 if (unlikely(child->ptrace)) {
287 /*
288 * It doesn't matter who attached/attaching to this
289 * task, the pending SIGSTOP is right in any case.
290 */
291 sigaddset(&child->pending.signal, SIGSTOP);
292 set_tsk_thread_flag(child, TIF_SIGPENDING);
293 }
294 }
295
296 /**
297 * tracehook_report_clone_complete - new child is running
298 * @trace: return value from tracehook_prepare_clone()
299 * @regs: parent's user register state
300 * @clone_flags: flags from parent's system call
301 * @pid: new child's PID in the parent's namespace
302 * @child: child task, already running
303 *
304 * This is called just after the child has started running. This is
305 * just before the clone/fork syscall returns, or blocks for vfork
306 * child completion if @clone_flags has the %CLONE_VFORK bit set.
307 * The @child pointer may be invalid if a self-reaping child died and
308 * tracehook_report_clone() took no action to prevent it from self-reaping.
309 *
310 * Called with no locks held.
311 */
312 static inline void tracehook_report_clone_complete(int trace,
313 struct pt_regs *regs,
314 unsigned long clone_flags,
315 pid_t pid,
316 struct task_struct *child)
317 {
318 if (unlikely(trace))
319 ptrace_event(trace, pid);
320 }
321
322 /**
323 * tracehook_report_vfork_done - vfork parent's child has exited or exec'd
324 * @child: child task, already running
325 * @pid: new child's PID in the parent's namespace
326 *
327 * Called after a %CLONE_VFORK parent has waited for the child to complete.
328 * The clone/vfork system call will return immediately after this.
329 * The @child pointer may be invalid if a self-reaping child died and
330 * tracehook_report_clone() took no action to prevent it from self-reaping.
331 *
332 * Called with no locks held.
333 */
334 static inline void tracehook_report_vfork_done(struct task_struct *child,
335 pid_t pid)
336 {
337 ptrace_event(PTRACE_EVENT_VFORK_DONE, pid);
338 }
339
340 /**
341 * tracehook_prepare_release_task - task is being reaped, clean up tracing
342 * @task: task in %EXIT_DEAD state
343 *
344 * This is called in release_task() just before @task gets finally reaped
345 * and freed. This would be the ideal place to remove and clean up any
346 * tracing-related state for @task.
347 *
348 * Called with no locks held.
349 */
350 static inline void tracehook_prepare_release_task(struct task_struct *task)
351 {
352 }
353
354 /**
355 * tracehook_finish_release_task - final tracing clean-up
356 * @task: task in %EXIT_DEAD state
357 *
358 * This is called in release_task() when @task is being in the middle of
359 * being reaped. After this, there must be no tracing entanglements.
360 *
361 * Called with write_lock_irq(&tasklist_lock) held.
362 */
363 static inline void tracehook_finish_release_task(struct task_struct *task)
364 {
365 ptrace_release_task(task);
366 }
367
368 /**
369 * tracehook_signal_handler - signal handler setup is complete
370 * @sig: number of signal being delivered
371 * @info: siginfo_t of signal being delivered
372 * @ka: sigaction setting that chose the handler
373 * @regs: user register state
374 * @stepping: nonzero if debugger single-step or block-step in use
375 *
376 * Called by the arch code after a signal handler has been set up.
377 * Register and stack state reflects the user handler about to run.
378 * Signal mask changes have already been made.
379 *
380 * Called without locks, shortly before returning to user mode
381 * (or handling more signals).
382 */
383 static inline void tracehook_signal_handler(int sig, siginfo_t *info,
384 const struct k_sigaction *ka,
385 struct pt_regs *regs, int stepping)
386 {
387 if (stepping)
388 ptrace_notify(SIGTRAP);
389 }
390
391 /**
392 * tracehook_consider_ignored_signal - suppress short-circuit of ignored signal
393 * @task: task receiving the signal
394 * @sig: signal number being sent
395 *
396 * Return zero iff tracing doesn't care to examine this ignored signal,
397 * so it can short-circuit normal delivery and never even get queued.
398 *
399 * Called with @task->sighand->siglock held.
400 */
401 static inline int tracehook_consider_ignored_signal(struct task_struct *task,
402 int sig)
403 {
404 return (task->ptrace & PT_PTRACED) != 0;
405 }
406
407 /**
408 * tracehook_consider_fatal_signal - suppress special handling of fatal signal
409 * @task: task receiving the signal
410 * @sig: signal number being sent
411 *
412 * Return nonzero to prevent special handling of this termination signal.
413 * Normally handler for signal is %SIG_DFL. It can be %SIG_IGN if @sig is
414 * ignored, in which case force_sig() is about to reset it to %SIG_DFL.
415 * When this returns zero, this signal might cause a quick termination
416 * that does not give the debugger a chance to intercept the signal.
417 *
418 * Called with or without @task->sighand->siglock held.
419 */
420 static inline int tracehook_consider_fatal_signal(struct task_struct *task,
421 int sig)
422 {
423 return (task->ptrace & PT_PTRACED) != 0;
424 }
425
426 #define DEATH_REAP -1
427 #define DEATH_DELAYED_GROUP_LEADER -2
428
429 /**
430 * tracehook_notify_death - task is dead, ready to notify parent
431 * @task: @current task now exiting
432 * @death_cookie: value to pass to tracehook_report_death()
433 * @group_dead: nonzero if this was the last thread in the group to die
434 *
435 * A return value >= 0 means call do_notify_parent() with that signal
436 * number. Negative return value can be %DEATH_REAP to self-reap right
437 * now, or %DEATH_DELAYED_GROUP_LEADER to a zombie without notifying our
438 * parent. Note that a return value of 0 means a do_notify_parent() call
439 * that sends no signal, but still wakes up a parent blocked in wait*().
440 *
441 * Called with write_lock_irq(&tasklist_lock) held.
442 */
443 static inline int tracehook_notify_death(struct task_struct *task,
444 void **death_cookie, int group_dead)
445 {
446 if (task_detached(task))
447 return task->ptrace ? SIGCHLD : DEATH_REAP;
448
449 /*
450 * If something other than our normal parent is ptracing us, then
451 * send it a SIGCHLD instead of honoring exit_signal. exit_signal
452 * only has special meaning to our real parent.
453 */
454 if (thread_group_empty(task) && !ptrace_reparented(task))
455 return task->exit_signal;
456
457 return task->ptrace ? SIGCHLD : DEATH_DELAYED_GROUP_LEADER;
458 }
459
460 /**
461 * tracehook_report_death - task is dead and ready to be reaped
462 * @task: @current task now exiting
463 * @signal: return value from tracheook_notify_death()
464 * @death_cookie: value passed back from tracehook_notify_death()
465 * @group_dead: nonzero if this was the last thread in the group to die
466 *
467 * Thread has just become a zombie or is about to self-reap. If positive,
468 * @signal is the signal number just sent to the parent (usually %SIGCHLD).
469 * If @signal is %DEATH_REAP, this thread will self-reap. If @signal is
470 * %DEATH_DELAYED_GROUP_LEADER, this is a delayed_group_leader() zombie.
471 * The @death_cookie was passed back by tracehook_notify_death().
472 *
473 * If normal reaping is not inhibited, @task->exit_state might be changing
474 * in parallel.
475 *
476 * Called without locks.
477 */
478 static inline void tracehook_report_death(struct task_struct *task,
479 int signal, void *death_cookie,
480 int group_dead)
481 {
482 }
483
484 #ifdef TIF_NOTIFY_RESUME
485 /**
486 * set_notify_resume - cause tracehook_notify_resume() to be called
487 * @task: task that will call tracehook_notify_resume()
488 *
489 * Calling this arranges that @task will call tracehook_notify_resume()
490 * before returning to user mode. If it's already running in user mode,
491 * it will enter the kernel and call tracehook_notify_resume() soon.
492 * If it's blocked, it will not be woken.
493 */
494 static inline void set_notify_resume(struct task_struct *task)
495 {
496 if (!test_and_set_tsk_thread_flag(task, TIF_NOTIFY_RESUME))
497 kick_process(task);
498 }
499
500 /**
501 * tracehook_notify_resume - report when about to return to user mode
502 * @regs: user-mode registers of @current task
503 *
504 * This is called when %TIF_NOTIFY_RESUME has been set. Now we are
505 * about to return to user mode, and the user state in @regs can be
506 * inspected or adjusted. The caller in arch code has cleared
507 * %TIF_NOTIFY_RESUME before the call. If the flag gets set again
508 * asynchronously, this will be called again before we return to
509 * user mode.
510 *
511 * Called without locks.
512 */
513 static inline void tracehook_notify_resume(struct pt_regs *regs)
514 {
515 }
516 #endif /* TIF_NOTIFY_RESUME */
517
518 #endif /* <linux/tracehook.h> */