tracehook.h 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518
  1. /*
  2. * Tracing hooks
  3. *
  4. * Copyright (C) 2008-2009 Red Hat, Inc. All rights reserved.
  5. *
  6. * This copyrighted material is made available to anyone wishing to use,
  7. * modify, copy, or redistribute it subject to the terms and conditions
  8. * of the GNU General Public License v.2.
  9. *
  10. * This file defines hook entry points called by core code where
  11. * user tracing/debugging support might need to do something. These
  12. * entry points are called tracehook_*(). Each hook declared below
  13. * has a detailed kerneldoc comment giving the context (locking et
  14. * al) from which it is called, and the meaning of its return value.
  15. *
  16. * Each function here typically has only one call site, so it is ok
  17. * to have some nontrivial tracehook_*() inlines. In all cases, the
  18. * fast path when no tracing is enabled should be very short.
  19. *
  20. * The purpose of this file and the tracehook_* layer is to consolidate
  21. * the interface that the kernel core and arch code uses to enable any
  22. * user debugging or tracing facility (such as ptrace). The interfaces
  23. * here are carefully documented so that maintainers of core and arch
  24. * code do not need to think about the implementation details of the
  25. * tracing facilities. Likewise, maintainers of the tracing code do not
  26. * need to understand all the calling core or arch code in detail, just
  27. * documented circumstances of each call, such as locking conditions.
  28. *
  29. * If the calling core code changes so that locking is different, then
  30. * it is ok to change the interface documented here. The maintainer of
  31. * core code changing should notify the maintainers of the tracing code
  32. * that they need to work out the change.
  33. *
  34. * Some tracehook_*() inlines take arguments that the current tracing
  35. * implementations might not necessarily use. These function signatures
  36. * are chosen to pass in all the information that is on hand in the
  37. * caller and might conceivably be relevant to a tracer, so that the
  38. * core code won't have to be updated when tracing adds more features.
  39. * If a call site changes so that some of those parameters are no longer
  40. * already on hand without extra work, then the tracehook_* interface
  41. * can change so there is no make-work burden on the core code. The
  42. * maintainer of core code changing should notify the maintainers of the
  43. * tracing code that they need to work out the change.
  44. */
  45. #ifndef _LINUX_TRACEHOOK_H
  46. #define _LINUX_TRACEHOOK_H 1
  47. #include <linux/sched.h>
  48. #include <linux/ptrace.h>
  49. #include <linux/security.h>
  50. struct linux_binprm;
  51. /**
  52. * tracehook_expect_breakpoints - guess if task memory might be touched
  53. * @task: current task, making a new mapping
  54. *
  55. * Return nonzero if @task is expected to want breakpoint insertion in
  56. * its memory at some point. A zero return is no guarantee it won't
  57. * be done, but this is a hint that it's known to be likely.
  58. *
  59. * May be called with @task->mm->mmap_sem held for writing.
  60. */
  61. static inline int tracehook_expect_breakpoints(struct task_struct *task)
  62. {
  63. return (task->ptrace & PT_PTRACED) != 0;
  64. }
  65. /*
  66. * ptrace report for syscall entry and exit looks identical.
  67. */
  68. static inline void ptrace_report_syscall(struct pt_regs *regs)
  69. {
  70. int ptrace = current->ptrace;
  71. if (!(ptrace & PT_PTRACED))
  72. return;
  73. ptrace_notify(SIGTRAP | ((ptrace & PT_TRACESYSGOOD) ? 0x80 : 0));
  74. /*
  75. * this isn't the same as continuing with a signal, but it will do
  76. * for normal use. strace only continues with a signal if the
  77. * stopping signal is not SIGTRAP. -brl
  78. */
  79. if (current->exit_code) {
  80. send_sig(current->exit_code, current, 1);
  81. current->exit_code = 0;
  82. }
  83. }
  84. /**
  85. * tracehook_report_syscall_entry - task is about to attempt a system call
  86. * @regs: user register state of current task
  87. *
  88. * This will be called if %TIF_SYSCALL_TRACE has been set, when the
  89. * current task has just entered the kernel for a system call.
  90. * Full user register state is available here. Changing the values
  91. * in @regs can affect the system call number and arguments to be tried.
  92. * It is safe to block here, preventing the system call from beginning.
  93. *
  94. * Returns zero normally, or nonzero if the calling arch code should abort
  95. * the system call. That must prevent normal entry so no system call is
  96. * made. If @task ever returns to user mode after this, its register state
  97. * is unspecified, but should be something harmless like an %ENOSYS error
  98. * return. It should preserve enough information so that syscall_rollback()
  99. * can work (see asm-generic/syscall.h).
  100. *
  101. * Called without locks, just after entering kernel mode.
  102. */
  103. static inline __must_check int tracehook_report_syscall_entry(
  104. struct pt_regs *regs)
  105. {
  106. ptrace_report_syscall(regs);
  107. return 0;
  108. }
  109. /**
  110. * tracehook_report_syscall_exit - task has just finished a system call
  111. * @regs: user register state of current task
  112. * @step: nonzero if simulating single-step or block-step
  113. *
  114. * This will be called if %TIF_SYSCALL_TRACE has been set, when the
  115. * current task has just finished an attempted system call. Full
  116. * user register state is available here. It is safe to block here,
  117. * preventing signals from being processed.
  118. *
  119. * If @step is nonzero, this report is also in lieu of the normal
  120. * trap that would follow the system call instruction because
  121. * user_enable_block_step() or user_enable_single_step() was used.
  122. * In this case, %TIF_SYSCALL_TRACE might not be set.
  123. *
  124. * Called without locks, just before checking for pending signals.
  125. */
  126. static inline void tracehook_report_syscall_exit(struct pt_regs *regs, int step)
  127. {
  128. if (step) {
  129. siginfo_t info;
  130. user_single_step_siginfo(current, regs, &info);
  131. force_sig_info(SIGTRAP, &info, current);
  132. return;
  133. }
  134. ptrace_report_syscall(regs);
  135. }
  136. /**
  137. * tracehook_unsafe_exec - check for exec declared unsafe due to tracing
  138. * @task: current task doing exec
  139. *
  140. * Return %LSM_UNSAFE_* bits applied to an exec because of tracing.
  141. *
  142. * @task->signal->cred_guard_mutex is held by the caller through the do_execve().
  143. */
  144. static inline int tracehook_unsafe_exec(struct task_struct *task)
  145. {
  146. int unsafe = 0;
  147. int ptrace = task->ptrace;
  148. if (ptrace & PT_PTRACED) {
  149. if (ptrace & PT_PTRACE_CAP)
  150. unsafe |= LSM_UNSAFE_PTRACE_CAP;
  151. else
  152. unsafe |= LSM_UNSAFE_PTRACE;
  153. }
  154. return unsafe;
  155. }
  156. /**
  157. * tracehook_tracer_task - return the task that is tracing the given task
  158. * @tsk: task to consider
  159. *
  160. * Returns NULL if no one is tracing @task, or the &struct task_struct
  161. * pointer to its tracer.
  162. *
  163. * Must called under rcu_read_lock(). The pointer returned might be kept
  164. * live only by RCU. During exec, this may be called with task_lock()
  165. * held on @task, still held from when tracehook_unsafe_exec() was called.
  166. */
  167. static inline struct task_struct *tracehook_tracer_task(struct task_struct *tsk)
  168. {
  169. if (tsk->ptrace & PT_PTRACED)
  170. return rcu_dereference(tsk->parent);
  171. return NULL;
  172. }
  173. /**
  174. * tracehook_report_exec - a successful exec was completed
  175. * @fmt: &struct linux_binfmt that performed the exec
  176. * @bprm: &struct linux_binprm containing exec details
  177. * @regs: user-mode register state
  178. *
  179. * An exec just completed, we are shortly going to return to user mode.
  180. * The freshly initialized register state can be seen and changed in @regs.
  181. * The name, file and other pointers in @bprm are still on hand to be
  182. * inspected, but will be freed as soon as this returns.
  183. *
  184. * Called with no locks, but with some kernel resources held live
  185. * and a reference on @fmt->module.
  186. */
  187. static inline void tracehook_report_exec(struct linux_binfmt *fmt,
  188. struct linux_binprm *bprm,
  189. struct pt_regs *regs)
  190. {
  191. ptrace_event(PTRACE_EVENT_EXEC, 0);
  192. }
  193. /**
  194. * tracehook_report_exit - task has begun to exit
  195. * @exit_code: pointer to value destined for @current->exit_code
  196. *
  197. * @exit_code points to the value passed to do_exit(), which tracing
  198. * might change here. This is almost the first thing in do_exit(),
  199. * before freeing any resources or setting the %PF_EXITING flag.
  200. *
  201. * Called with no locks held.
  202. */
  203. static inline void tracehook_report_exit(long *exit_code)
  204. {
  205. ptrace_event(PTRACE_EVENT_EXIT, *exit_code);
  206. }
  207. /**
  208. * tracehook_prepare_clone - prepare for new child to be cloned
  209. * @clone_flags: %CLONE_* flags from clone/fork/vfork system call
  210. *
  211. * This is called before a new user task is to be cloned.
  212. * Its return value will be passed to tracehook_finish_clone().
  213. *
  214. * Called with no locks held.
  215. */
  216. static inline int tracehook_prepare_clone(unsigned clone_flags)
  217. {
  218. int event = 0;
  219. if (clone_flags & CLONE_UNTRACED)
  220. return 0;
  221. if (clone_flags & CLONE_VFORK)
  222. event = PTRACE_EVENT_VFORK;
  223. else if ((clone_flags & CSIGNAL) != SIGCHLD)
  224. event = PTRACE_EVENT_CLONE;
  225. else
  226. event = PTRACE_EVENT_FORK;
  227. return ptrace_event_enabled(current, event) ? event : 0;
  228. }
  229. /**
  230. * tracehook_finish_clone - new child created and being attached
  231. * @child: new child task
  232. * @clone_flags: %CLONE_* flags from clone/fork/vfork system call
  233. * @trace: return value from tracehook_prepare_clone()
  234. *
  235. * This is called immediately after adding @child to its parent's children list.
  236. * The @trace value is that returned by tracehook_prepare_clone().
  237. *
  238. * Called with current's siglock and write_lock_irq(&tasklist_lock) held.
  239. */
  240. static inline void tracehook_finish_clone(struct task_struct *child,
  241. unsigned long clone_flags, int trace)
  242. {
  243. ptrace_init_task(child, (clone_flags & CLONE_PTRACE) || trace);
  244. }
  245. /**
  246. * tracehook_report_clone - in parent, new child is about to start running
  247. * @regs: parent's user register state
  248. * @clone_flags: flags from parent's system call
  249. * @pid: new child's PID in the parent's namespace
  250. * @child: new child task
  251. *
  252. * Called after a child is set up, but before it has been started running.
  253. * This is not a good place to block, because the child has not started
  254. * yet. Suspend the child here if desired, and then block in
  255. * tracehook_report_clone_complete(). This must prevent the child from
  256. * self-reaping if tracehook_report_clone_complete() uses the @child
  257. * pointer; otherwise it might have died and been released by the time
  258. * tracehook_report_clone_complete() is called.
  259. *
  260. * Called with no locks held, but the child cannot run until this returns.
  261. */
  262. static inline void tracehook_report_clone(struct pt_regs *regs,
  263. unsigned long clone_flags,
  264. pid_t pid, struct task_struct *child)
  265. {
  266. if (unlikely(child->ptrace)) {
  267. /*
  268. * It doesn't matter who attached/attaching to this
  269. * task, the pending SIGSTOP is right in any case.
  270. */
  271. sigaddset(&child->pending.signal, SIGSTOP);
  272. set_tsk_thread_flag(child, TIF_SIGPENDING);
  273. }
  274. }
  275. /**
  276. * tracehook_report_clone_complete - new child is running
  277. * @trace: return value from tracehook_prepare_clone()
  278. * @regs: parent's user register state
  279. * @clone_flags: flags from parent's system call
  280. * @pid: new child's PID in the parent's namespace
  281. * @child: child task, already running
  282. *
  283. * This is called just after the child has started running. This is
  284. * just before the clone/fork syscall returns, or blocks for vfork
  285. * child completion if @clone_flags has the %CLONE_VFORK bit set.
  286. * The @child pointer may be invalid if a self-reaping child died and
  287. * tracehook_report_clone() took no action to prevent it from self-reaping.
  288. *
  289. * Called with no locks held.
  290. */
  291. static inline void tracehook_report_clone_complete(int trace,
  292. struct pt_regs *regs,
  293. unsigned long clone_flags,
  294. pid_t pid,
  295. struct task_struct *child)
  296. {
  297. if (unlikely(trace))
  298. ptrace_event(trace, pid);
  299. }
  300. /**
  301. * tracehook_report_vfork_done - vfork parent's child has exited or exec'd
  302. * @child: child task, already running
  303. * @pid: new child's PID in the parent's namespace
  304. *
  305. * Called after a %CLONE_VFORK parent has waited for the child to complete.
  306. * The clone/vfork system call will return immediately after this.
  307. * The @child pointer may be invalid if a self-reaping child died and
  308. * tracehook_report_clone() took no action to prevent it from self-reaping.
  309. *
  310. * Called with no locks held.
  311. */
  312. static inline void tracehook_report_vfork_done(struct task_struct *child,
  313. pid_t pid)
  314. {
  315. ptrace_event(PTRACE_EVENT_VFORK_DONE, pid);
  316. }
  /**
   * tracehook_prepare_release_task - task is being reaped, clean up tracing
   * @task:	task in %EXIT_DEAD state
   *
   * Called in release_task() just before @task is finally reaped and
   * freed.  This would be the ideal place to remove and clean up any
   * tracing-related state for @task.
   *
   * Called with no locks held.
   */
  static inline void tracehook_prepare_release_task(struct task_struct *task)
  {
  	/* Nothing to do in this implementation. */
  }
  /**
   * tracehook_finish_release_task - final tracing clean-up
   * @task:	task in %EXIT_DEAD state
   *
   * Called in release_task() while @task is in the middle of being
   * reaped.  After this, there must be no tracing entanglements.
   *
   * Called with write_lock_irq(&tasklist_lock) held.
   */
  static inline void tracehook_finish_release_task(struct task_struct *task)
  {
  	/* Hand the task over to ptrace for its release-time clean-up. */
  	ptrace_release_task(task);
  }
  343. /**
  344. * tracehook_signal_handler - signal handler setup is complete
  345. * @sig: number of signal being delivered
  346. * @info: siginfo_t of signal being delivered
  347. * @ka: sigaction setting that chose the handler
  348. * @regs: user register state
  349. * @stepping: nonzero if debugger single-step or block-step in use
  350. *
  351. * Called by the arch code after a signal handler has been set up.
  352. * Register and stack state reflects the user handler about to run.
  353. * Signal mask changes have already been made.
  354. *
  355. * Called without locks, shortly before returning to user mode
  356. * (or handling more signals).
  357. */
  358. static inline void tracehook_signal_handler(int sig, siginfo_t *info,
  359. const struct k_sigaction *ka,
  360. struct pt_regs *regs, int stepping)
  361. {
  362. if (stepping)
  363. ptrace_notify(SIGTRAP);
  364. }
  365. /**
  366. * tracehook_consider_ignored_signal - suppress short-circuit of ignored signal
  367. * @task: task receiving the signal
  368. * @sig: signal number being sent
  369. *
  370. * Return zero iff tracing doesn't care to examine this ignored signal,
  371. * so it can short-circuit normal delivery and never even get queued.
  372. *
  373. * Called with @task->sighand->siglock held.
  374. */
  375. static inline int tracehook_consider_ignored_signal(struct task_struct *task,
  376. int sig)
  377. {
  378. return (task->ptrace & PT_PTRACED) != 0;
  379. }
  380. /**
  381. * tracehook_consider_fatal_signal - suppress special handling of fatal signal
  382. * @task: task receiving the signal
  383. * @sig: signal number being sent
  384. *
  385. * Return nonzero to prevent special handling of this termination signal.
  386. * Normally handler for signal is %SIG_DFL. It can be %SIG_IGN if @sig is
  387. * ignored, in which case force_sig() is about to reset it to %SIG_DFL.
  388. * When this returns zero, this signal might cause a quick termination
  389. * that does not give the debugger a chance to intercept the signal.
  390. *
  391. * Called with or without @task->sighand->siglock held.
  392. */
  393. static inline int tracehook_consider_fatal_signal(struct task_struct *task,
  394. int sig)
  395. {
  396. return (task->ptrace & PT_PTRACED) != 0;
  397. }
  /*
   * Negative return values of tracehook_notify_death(); values >= 0 are
   * signal numbers.  Parenthesized so the constants stay intact inside
   * any surrounding expression.
   */
  #define DEATH_REAP			(-1)
  #define DEATH_DELAYED_GROUP_LEADER	(-2)
  400. /**
  401. * tracehook_notify_death - task is dead, ready to notify parent
  402. * @task: @current task now exiting
  403. * @death_cookie: value to pass to tracehook_report_death()
  404. * @group_dead: nonzero if this was the last thread in the group to die
  405. *
  406. * A return value >= 0 means call do_notify_parent() with that signal
  407. * number. Negative return value can be %DEATH_REAP to self-reap right
  408. * now, or %DEATH_DELAYED_GROUP_LEADER to a zombie without notifying our
  409. * parent. Note that a return value of 0 means a do_notify_parent() call
  410. * that sends no signal, but still wakes up a parent blocked in wait*().
  411. *
  412. * Called with write_lock_irq(&tasklist_lock) held.
  413. */
  414. static inline int tracehook_notify_death(struct task_struct *task,
  415. void **death_cookie, int group_dead)
  416. {
  417. if (task_detached(task))
  418. return task->ptrace ? SIGCHLD : DEATH_REAP;
  419. /*
  420. * If something other than our normal parent is ptracing us, then
  421. * send it a SIGCHLD instead of honoring exit_signal. exit_signal
  422. * only has special meaning to our real parent.
  423. */
  424. if (thread_group_empty(task) && !ptrace_reparented(task))
  425. return task->exit_signal;
  426. return task->ptrace ? SIGCHLD : DEATH_DELAYED_GROUP_LEADER;
  427. }
  /**
   * tracehook_report_death - task is dead and ready to be reaped
   * @task:		@current task now exiting
   * @signal:		return value from tracehook_notify_death()
   * @death_cookie:	value passed back from tracehook_notify_death()
   * @group_dead:		nonzero if this was the last thread in the group to die
   *
   * The thread has just become a zombie or is about to self-reap.  A
   * positive @signal is the signal number just sent to the parent
   * (usually %SIGCHLD).  If @signal is %DEATH_REAP, this thread will
   * self-reap.  If @signal is %DEATH_DELAYED_GROUP_LEADER, this is a
   * delayed_group_leader() zombie.  The @death_cookie was passed back by
   * tracehook_notify_death().
   *
   * If normal reaping is not inhibited, @task->exit_state might be
   * changing in parallel.
   *
   * Called without locks.
   */
  static inline void tracehook_report_death(struct task_struct *task,
  					  int signal, void *death_cookie,
  					  int group_dead)
  {
  	/* Nothing to do in this implementation. */
  }
  451. #ifdef TIF_NOTIFY_RESUME
  452. /**
  453. * set_notify_resume - cause tracehook_notify_resume() to be called
  454. * @task: task that will call tracehook_notify_resume()
  455. *
  456. * Calling this arranges that @task will call tracehook_notify_resume()
  457. * before returning to user mode. If it's already running in user mode,
  458. * it will enter the kernel and call tracehook_notify_resume() soon.
  459. * If it's blocked, it will not be woken.
  460. */
  461. static inline void set_notify_resume(struct task_struct *task)
  462. {
  463. if (!test_and_set_tsk_thread_flag(task, TIF_NOTIFY_RESUME))
  464. kick_process(task);
  465. }
  /**
   * tracehook_notify_resume - report when about to return to user mode
   * @regs:	user-mode registers of @current task
   *
   * Called when %TIF_NOTIFY_RESUME has been set.  We are now about to
   * return to user mode, and the user state in @regs can be inspected or
   * adjusted.  The caller in arch code has cleared %TIF_NOTIFY_RESUME
   * before the call.  If the flag gets set again asynchronously, this
   * will be called again before we return to user mode.
   *
   * Called without locks.
   */
  static inline void tracehook_notify_resume(struct pt_regs *regs)
  {
  	/* Nothing to do in this implementation. */
  }
  482. #endif /* TIF_NOTIFY_RESUME */
  483. #endif /* <linux/tracehook.h> */