ptrace.c 37 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548
  1. /* By Ross Biro 1/23/92 */
  2. /*
  3. * Pentium III FXSR, SSE support
  4. * Gareth Hughes <gareth@valinux.com>, May 2000
  5. *
  6. * BTS tracing
  7. * Markus Metzger <markus.t.metzger@intel.com>, Dec 2007
  8. */
  9. #include <linux/kernel.h>
  10. #include <linux/sched.h>
  11. #include <linux/mm.h>
  12. #include <linux/smp.h>
  13. #include <linux/errno.h>
  14. #include <linux/ptrace.h>
  15. #include <linux/regset.h>
  16. #include <linux/tracehook.h>
  17. #include <linux/user.h>
  18. #include <linux/elf.h>
  19. #include <linux/security.h>
  20. #include <linux/audit.h>
  21. #include <linux/seccomp.h>
  22. #include <linux/signal.h>
  23. #include <linux/workqueue.h>
  24. #include <asm/uaccess.h>
  25. #include <asm/pgtable.h>
  26. #include <asm/system.h>
  27. #include <asm/processor.h>
  28. #include <asm/i387.h>
  29. #include <asm/debugreg.h>
  30. #include <asm/ldt.h>
  31. #include <asm/desc.h>
  32. #include <asm/prctl.h>
  33. #include <asm/proto.h>
  34. #include <asm/ds.h>
  35. #include <trace/syscall.h>
  36. #include "tls.h"
  /*
   * Identifiers for the x86 register sets.  REGSET_GENERAL and REGSET_FP
   * are the values arch_ptrace() hands to copy_regset_{to,from}_user().
   * REGSET_IOPERM64 deliberately shares its number with REGSET_XFP.
   */
  enum x86_regset {
      REGSET_GENERAL  = 0,
      REGSET_FP       = 1,
      REGSET_XFP      = 2,
      REGSET_IOPERM64 = REGSET_XFP,
      REGSET_TLS      = 3,
      REGSET_IOPERM32 = 4,
  };
  45. /*
  46. * does not yet catch signals sent when the child dies.
  47. * in exit.c or in signal.c.
  48. */
  /*
   * EFLAGS bits the user is allowed to access
   * [bit set = accessible, bit clear = not accessible].
   */
  #define FLAG_MASK_32 ((unsigned long)   \
      (X86_EFLAGS_CF |                    \
       X86_EFLAGS_PF |                    \
       X86_EFLAGS_AF |                    \
       X86_EFLAGS_ZF |                    \
       X86_EFLAGS_SF |                    \
       X86_EFLAGS_TF |                    \
       X86_EFLAGS_DF |                    \
       X86_EFLAGS_OF |                    \
       X86_EFLAGS_RF |                    \
       X86_EFLAGS_AC))
  58. /*
  59. * Determines whether a value may be installed in a segment register.
  60. */
  61. static inline bool invalid_selector(u16 value)
  62. {
  63. return unlikely(value != 0 && (value & SEGMENT_RPL_MASK) != USER_RPL);
  64. }
  65. #ifdef CONFIG_X86_32
  66. #define FLAG_MASK FLAG_MASK_32
  67. static unsigned long *pt_regs_access(struct pt_regs *regs, unsigned long regno)
  68. {
  69. BUILD_BUG_ON(offsetof(struct pt_regs, bx) != 0);
  70. return &regs->bx + (regno >> 2);
  71. }
  72. static u16 get_segment_reg(struct task_struct *task, unsigned long offset)
  73. {
  74. /*
  75. * Returning the value truncates it to 16 bits.
  76. */
  77. unsigned int retval;
  78. if (offset != offsetof(struct user_regs_struct, gs))
  79. retval = *pt_regs_access(task_pt_regs(task), offset);
  80. else {
  81. if (task == current)
  82. retval = get_user_gs(task_pt_regs(task));
  83. else
  84. retval = task_user_gs(task);
  85. }
  86. return retval;
  87. }
  88. static int set_segment_reg(struct task_struct *task,
  89. unsigned long offset, u16 value)
  90. {
  91. /*
  92. * The value argument was already truncated to 16 bits.
  93. */
  94. if (invalid_selector(value))
  95. return -EIO;
  96. /*
  97. * For %cs and %ss we cannot permit a null selector.
  98. * We can permit a bogus selector as long as it has USER_RPL.
  99. * Null selectors are fine for other segment registers, but
  100. * we will never get back to user mode with invalid %cs or %ss
  101. * and will take the trap in iret instead. Much code relies
  102. * on user_mode() to distinguish a user trap frame (which can
  103. * safely use invalid selectors) from a kernel trap frame.
  104. */
  105. switch (offset) {
  106. case offsetof(struct user_regs_struct, cs):
  107. case offsetof(struct user_regs_struct, ss):
  108. if (unlikely(value == 0))
  109. return -EIO;
  110. default:
  111. *pt_regs_access(task_pt_regs(task), offset) = value;
  112. break;
  113. case offsetof(struct user_regs_struct, gs):
  114. if (task == current)
  115. set_user_gs(task_pt_regs(task), value);
  116. else
  117. task_user_gs(task) = value;
  118. }
  119. return 0;
  120. }
  121. static unsigned long debugreg_addr_limit(struct task_struct *task)
  122. {
  123. return TASK_SIZE - 3;
  124. }
  125. #else /* CONFIG_X86_64 */
  126. #define FLAG_MASK (FLAG_MASK_32 | X86_EFLAGS_NT)
  127. static unsigned long *pt_regs_access(struct pt_regs *regs, unsigned long offset)
  128. {
  129. BUILD_BUG_ON(offsetof(struct pt_regs, r15) != 0);
  130. return &regs->r15 + (offset / sizeof(regs->r15));
  131. }
  132. static u16 get_segment_reg(struct task_struct *task, unsigned long offset)
  133. {
  134. /*
  135. * Returning the value truncates it to 16 bits.
  136. */
  137. unsigned int seg;
  138. switch (offset) {
  139. case offsetof(struct user_regs_struct, fs):
  140. if (task == current) {
  141. /* Older gas can't assemble movq %?s,%r?? */
  142. asm("movl %%fs,%0" : "=r" (seg));
  143. return seg;
  144. }
  145. return task->thread.fsindex;
  146. case offsetof(struct user_regs_struct, gs):
  147. if (task == current) {
  148. asm("movl %%gs,%0" : "=r" (seg));
  149. return seg;
  150. }
  151. return task->thread.gsindex;
  152. case offsetof(struct user_regs_struct, ds):
  153. if (task == current) {
  154. asm("movl %%ds,%0" : "=r" (seg));
  155. return seg;
  156. }
  157. return task->thread.ds;
  158. case offsetof(struct user_regs_struct, es):
  159. if (task == current) {
  160. asm("movl %%es,%0" : "=r" (seg));
  161. return seg;
  162. }
  163. return task->thread.es;
  164. case offsetof(struct user_regs_struct, cs):
  165. case offsetof(struct user_regs_struct, ss):
  166. break;
  167. }
  168. return *pt_regs_access(task_pt_regs(task), offset);
  169. }
  170. static int set_segment_reg(struct task_struct *task,
  171. unsigned long offset, u16 value)
  172. {
  173. /*
  174. * The value argument was already truncated to 16 bits.
  175. */
  176. if (invalid_selector(value))
  177. return -EIO;
  178. switch (offset) {
  179. case offsetof(struct user_regs_struct,fs):
  180. /*
  181. * If this is setting fs as for normal 64-bit use but
  182. * setting fs_base has implicitly changed it, leave it.
  183. */
  184. if ((value == FS_TLS_SEL && task->thread.fsindex == 0 &&
  185. task->thread.fs != 0) ||
  186. (value == 0 && task->thread.fsindex == FS_TLS_SEL &&
  187. task->thread.fs == 0))
  188. break;
  189. task->thread.fsindex = value;
  190. if (task == current)
  191. loadsegment(fs, task->thread.fsindex);
  192. break;
  193. case offsetof(struct user_regs_struct,gs):
  194. /*
  195. * If this is setting gs as for normal 64-bit use but
  196. * setting gs_base has implicitly changed it, leave it.
  197. */
  198. if ((value == GS_TLS_SEL && task->thread.gsindex == 0 &&
  199. task->thread.gs != 0) ||
  200. (value == 0 && task->thread.gsindex == GS_TLS_SEL &&
  201. task->thread.gs == 0))
  202. break;
  203. task->thread.gsindex = value;
  204. if (task == current)
  205. load_gs_index(task->thread.gsindex);
  206. break;
  207. case offsetof(struct user_regs_struct,ds):
  208. task->thread.ds = value;
  209. if (task == current)
  210. loadsegment(ds, task->thread.ds);
  211. break;
  212. case offsetof(struct user_regs_struct,es):
  213. task->thread.es = value;
  214. if (task == current)
  215. loadsegment(es, task->thread.es);
  216. break;
  217. /*
  218. * Can't actually change these in 64-bit mode.
  219. */
  220. case offsetof(struct user_regs_struct,cs):
  221. if (unlikely(value == 0))
  222. return -EIO;
  223. #ifdef CONFIG_IA32_EMULATION
  224. if (test_tsk_thread_flag(task, TIF_IA32))
  225. task_pt_regs(task)->cs = value;
  226. #endif
  227. break;
  228. case offsetof(struct user_regs_struct,ss):
  229. if (unlikely(value == 0))
  230. return -EIO;
  231. #ifdef CONFIG_IA32_EMULATION
  232. if (test_tsk_thread_flag(task, TIF_IA32))
  233. task_pt_regs(task)->ss = value;
  234. #endif
  235. break;
  236. }
  237. return 0;
  238. }
  239. static unsigned long debugreg_addr_limit(struct task_struct *task)
  240. {
  241. #ifdef CONFIG_IA32_EMULATION
  242. if (test_tsk_thread_flag(task, TIF_IA32))
  243. return IA32_PAGE_OFFSET - 3;
  244. #endif
  245. return TASK_SIZE_MAX - 7;
  246. }
  247. #endif /* CONFIG_X86_32 */
  248. static unsigned long get_flags(struct task_struct *task)
  249. {
  250. unsigned long retval = task_pt_regs(task)->flags;
  251. /*
  252. * If the debugger set TF, hide it from the readout.
  253. */
  254. if (test_tsk_thread_flag(task, TIF_FORCED_TF))
  255. retval &= ~X86_EFLAGS_TF;
  256. return retval;
  257. }
  258. static int set_flags(struct task_struct *task, unsigned long value)
  259. {
  260. struct pt_regs *regs = task_pt_regs(task);
  261. /*
  262. * If the user value contains TF, mark that
  263. * it was not "us" (the debugger) that set it.
  264. * If not, make sure it stays set if we had.
  265. */
  266. if (value & X86_EFLAGS_TF)
  267. clear_tsk_thread_flag(task, TIF_FORCED_TF);
  268. else if (test_tsk_thread_flag(task, TIF_FORCED_TF))
  269. value |= X86_EFLAGS_TF;
  270. regs->flags = (regs->flags & ~FLAG_MASK) | (value & FLAG_MASK);
  271. return 0;
  272. }
  273. static int putreg(struct task_struct *child,
  274. unsigned long offset, unsigned long value)
  275. {
  276. switch (offset) {
  277. case offsetof(struct user_regs_struct, cs):
  278. case offsetof(struct user_regs_struct, ds):
  279. case offsetof(struct user_regs_struct, es):
  280. case offsetof(struct user_regs_struct, fs):
  281. case offsetof(struct user_regs_struct, gs):
  282. case offsetof(struct user_regs_struct, ss):
  283. return set_segment_reg(child, offset, value);
  284. case offsetof(struct user_regs_struct, flags):
  285. return set_flags(child, value);
  286. #ifdef CONFIG_X86_64
  287. /*
  288. * Orig_ax is really just a flag with small positive and
  289. * negative values, so make sure to always sign-extend it
  290. * from 32 bits so that it works correctly regardless of
  291. * whether we come from a 32-bit environment or not.
  292. */
  293. case offsetof(struct user_regs_struct, orig_ax):
  294. value = (long) (s32) value;
  295. break;
  296. case offsetof(struct user_regs_struct,fs_base):
  297. if (value >= TASK_SIZE_OF(child))
  298. return -EIO;
  299. /*
  300. * When changing the segment base, use do_arch_prctl
  301. * to set either thread.fs or thread.fsindex and the
  302. * corresponding GDT slot.
  303. */
  304. if (child->thread.fs != value)
  305. return do_arch_prctl(child, ARCH_SET_FS, value);
  306. return 0;
  307. case offsetof(struct user_regs_struct,gs_base):
  308. /*
  309. * Exactly the same here as the %fs handling above.
  310. */
  311. if (value >= TASK_SIZE_OF(child))
  312. return -EIO;
  313. if (child->thread.gs != value)
  314. return do_arch_prctl(child, ARCH_SET_GS, value);
  315. return 0;
  316. #endif
  317. }
  318. *pt_regs_access(task_pt_regs(child), offset) = value;
  319. return 0;
  320. }
  321. static unsigned long getreg(struct task_struct *task, unsigned long offset)
  322. {
  323. switch (offset) {
  324. case offsetof(struct user_regs_struct, cs):
  325. case offsetof(struct user_regs_struct, ds):
  326. case offsetof(struct user_regs_struct, es):
  327. case offsetof(struct user_regs_struct, fs):
  328. case offsetof(struct user_regs_struct, gs):
  329. case offsetof(struct user_regs_struct, ss):
  330. return get_segment_reg(task, offset);
  331. case offsetof(struct user_regs_struct, flags):
  332. return get_flags(task);
  333. #ifdef CONFIG_X86_64
  334. case offsetof(struct user_regs_struct, fs_base): {
  335. /*
  336. * do_arch_prctl may have used a GDT slot instead of
  337. * the MSR. To userland, it appears the same either
  338. * way, except the %fs segment selector might not be 0.
  339. */
  340. unsigned int seg = task->thread.fsindex;
  341. if (task->thread.fs != 0)
  342. return task->thread.fs;
  343. if (task == current)
  344. asm("movl %%fs,%0" : "=r" (seg));
  345. if (seg != FS_TLS_SEL)
  346. return 0;
  347. return get_desc_base(&task->thread.tls_array[FS_TLS]);
  348. }
  349. case offsetof(struct user_regs_struct, gs_base): {
  350. /*
  351. * Exactly the same here as the %fs handling above.
  352. */
  353. unsigned int seg = task->thread.gsindex;
  354. if (task->thread.gs != 0)
  355. return task->thread.gs;
  356. if (task == current)
  357. asm("movl %%gs,%0" : "=r" (seg));
  358. if (seg != GS_TLS_SEL)
  359. return 0;
  360. return get_desc_base(&task->thread.tls_array[GS_TLS]);
  361. }
  362. #endif
  363. }
  364. return *pt_regs_access(task_pt_regs(task), offset);
  365. }
  366. static int genregs_get(struct task_struct *target,
  367. const struct user_regset *regset,
  368. unsigned int pos, unsigned int count,
  369. void *kbuf, void __user *ubuf)
  370. {
  371. if (kbuf) {
  372. unsigned long *k = kbuf;
  373. while (count > 0) {
  374. *k++ = getreg(target, pos);
  375. count -= sizeof(*k);
  376. pos += sizeof(*k);
  377. }
  378. } else {
  379. unsigned long __user *u = ubuf;
  380. while (count > 0) {
  381. if (__put_user(getreg(target, pos), u++))
  382. return -EFAULT;
  383. count -= sizeof(*u);
  384. pos += sizeof(*u);
  385. }
  386. }
  387. return 0;
  388. }
  389. static int genregs_set(struct task_struct *target,
  390. const struct user_regset *regset,
  391. unsigned int pos, unsigned int count,
  392. const void *kbuf, const void __user *ubuf)
  393. {
  394. int ret = 0;
  395. if (kbuf) {
  396. const unsigned long *k = kbuf;
  397. while (count > 0 && !ret) {
  398. ret = putreg(target, pos, *k++);
  399. count -= sizeof(*k);
  400. pos += sizeof(*k);
  401. }
  402. } else {
  403. const unsigned long __user *u = ubuf;
  404. while (count > 0 && !ret) {
  405. unsigned long word;
  406. ret = __get_user(word, u++);
  407. if (ret)
  408. break;
  409. ret = putreg(target, pos, word);
  410. count -= sizeof(*u);
  411. pos += sizeof(*u);
  412. }
  413. }
  414. return ret;
  415. }
  416. /*
  417. * This function is trivial and will be inlined by the compiler.
  418. * Having it separates the implementation details of debug
  419. * registers from the interface details of ptrace.
  420. */
  421. static unsigned long ptrace_get_debugreg(struct task_struct *child, int n)
  422. {
  423. switch (n) {
  424. case 0: return child->thread.debugreg0;
  425. case 1: return child->thread.debugreg1;
  426. case 2: return child->thread.debugreg2;
  427. case 3: return child->thread.debugreg3;
  428. case 6: return child->thread.debugreg6;
  429. case 7: return child->thread.debugreg7;
  430. }
  431. return 0;
  432. }
  433. static int ptrace_set_debugreg(struct task_struct *child,
  434. int n, unsigned long data)
  435. {
  436. int i;
  437. if (unlikely(n == 4 || n == 5))
  438. return -EIO;
  439. if (n < 4 && unlikely(data >= debugreg_addr_limit(child)))
  440. return -EIO;
  441. switch (n) {
  442. case 0: child->thread.debugreg0 = data; break;
  443. case 1: child->thread.debugreg1 = data; break;
  444. case 2: child->thread.debugreg2 = data; break;
  445. case 3: child->thread.debugreg3 = data; break;
  446. case 6:
  447. if ((data & ~0xffffffffUL) != 0)
  448. return -EIO;
  449. child->thread.debugreg6 = data;
  450. break;
  451. case 7:
  452. /*
  453. * Sanity-check data. Take one half-byte at once with
  454. * check = (val >> (16 + 4*i)) & 0xf. It contains the
  455. * R/Wi and LENi bits; bits 0 and 1 are R/Wi, and bits
  456. * 2 and 3 are LENi. Given a list of invalid values,
  457. * we do mask |= 1 << invalid_value, so that
  458. * (mask >> check) & 1 is a correct test for invalid
  459. * values.
  460. *
  461. * R/Wi contains the type of the breakpoint /
  462. * watchpoint, LENi contains the length of the watched
  463. * data in the watchpoint case.
  464. *
  465. * The invalid values are:
  466. * - LENi == 0x10 (undefined), so mask |= 0x0f00. [32-bit]
  467. * - R/Wi == 0x10 (break on I/O reads or writes), so
  468. * mask |= 0x4444.
  469. * - R/Wi == 0x00 && LENi != 0x00, so we have mask |=
  470. * 0x1110.
  471. *
  472. * Finally, mask = 0x0f00 | 0x4444 | 0x1110 == 0x5f54.
  473. *
  474. * See the Intel Manual "System Programming Guide",
  475. * 15.2.4
  476. *
  477. * Note that LENi == 0x10 is defined on x86_64 in long
  478. * mode (i.e. even for 32-bit userspace software, but
  479. * 64-bit kernel), so the x86_64 mask value is 0x5454.
  480. * See the AMD manual no. 24593 (AMD64 System Programming)
  481. */
  482. #ifdef CONFIG_X86_32
  483. #define DR7_MASK 0x5f54
  484. #else
  485. #define DR7_MASK 0x5554
  486. #endif
  487. data &= ~DR_CONTROL_RESERVED;
  488. for (i = 0; i < 4; i++)
  489. if ((DR7_MASK >> ((data >> (16 + 4*i)) & 0xf)) & 1)
  490. return -EIO;
  491. child->thread.debugreg7 = data;
  492. if (data)
  493. set_tsk_thread_flag(child, TIF_DEBUG);
  494. else
  495. clear_tsk_thread_flag(child, TIF_DEBUG);
  496. break;
  497. }
  498. return 0;
  499. }
  500. /*
  501. * These access the current or another (stopped) task's io permission
  502. * bitmap for debugging or core dump.
  503. */
  504. static int ioperm_active(struct task_struct *target,
  505. const struct user_regset *regset)
  506. {
  507. return target->thread.io_bitmap_max / regset->size;
  508. }
  509. static int ioperm_get(struct task_struct *target,
  510. const struct user_regset *regset,
  511. unsigned int pos, unsigned int count,
  512. void *kbuf, void __user *ubuf)
  513. {
  514. if (!target->thread.io_bitmap_ptr)
  515. return -ENXIO;
  516. return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
  517. target->thread.io_bitmap_ptr,
  518. 0, IO_BITMAP_BYTES);
  519. }
  520. #ifdef CONFIG_X86_PTRACE_BTS
  521. /*
  522. * A branch trace store context.
  523. *
  524. * Contexts may only be installed by ptrace_bts_config() and only for
  525. * ptraced tasks.
  526. *
  527. * Contexts are destroyed when the tracee is detached from the tracer.
  528. * The actual destruction work requires interrupts enabled, so the
  529. * work is deferred and will be scheduled during __ptrace_unlink().
  530. *
  531. * Contexts hold an additional task_struct reference on the traced
  532. * task, as well as a reference on the tracer's mm.
  533. *
  534. * Ptrace already holds a task_struct for the duration of ptrace operations,
  535. * but since destruction is deferred, it may be executed after both
  536. * tracer and tracee exited.
  537. */
  538. struct bts_context {
  539. /* The branch trace handle. */
  540. struct bts_tracer *tracer;
  541. /* The buffer used to store the branch trace and its size. */
  542. void *buffer;
  543. unsigned int size;
  544. /* The mm that paid for the above buffer. */
  545. struct mm_struct *mm;
  546. /* The task this context belongs to. */
  547. struct task_struct *task;
  548. /* The signal to send on a bts buffer overflow. */
  549. unsigned int bts_ovfl_signal;
  550. /* The work struct to destroy a context. */
  551. struct work_struct work;
  552. };
  553. static int alloc_bts_buffer(struct bts_context *context, unsigned int size)
  554. {
  555. void *buffer = NULL;
  556. int err = -ENOMEM;
  557. err = account_locked_memory(current->mm, current->signal->rlim, size);
  558. if (err < 0)
  559. return err;
  560. buffer = kzalloc(size, GFP_KERNEL);
  561. if (!buffer)
  562. goto out_refund;
  563. context->buffer = buffer;
  564. context->size = size;
  565. context->mm = get_task_mm(current);
  566. return 0;
  567. out_refund:
  568. refund_locked_memory(current->mm, size);
  569. return err;
  570. }
  571. static inline void free_bts_buffer(struct bts_context *context)
  572. {
  573. if (!context->buffer)
  574. return;
  575. kfree(context->buffer);
  576. context->buffer = NULL;
  577. refund_locked_memory(context->mm, context->size);
  578. context->size = 0;
  579. mmput(context->mm);
  580. context->mm = NULL;
  581. }
  582. static void free_bts_context_work(struct work_struct *w)
  583. {
  584. struct bts_context *context;
  585. context = container_of(w, struct bts_context, work);
  586. ds_release_bts(context->tracer);
  587. put_task_struct(context->task);
  588. free_bts_buffer(context);
  589. kfree(context);
  590. }
  591. static inline void free_bts_context(struct bts_context *context)
  592. {
  593. INIT_WORK(&context->work, free_bts_context_work);
  594. schedule_work(&context->work);
  595. }
  596. static inline struct bts_context *alloc_bts_context(struct task_struct *task)
  597. {
  598. struct bts_context *context = kzalloc(sizeof(*context), GFP_KERNEL);
  599. if (context) {
  600. context->task = task;
  601. task->bts = context;
  602. get_task_struct(task);
  603. }
  604. return context;
  605. }
  606. static int ptrace_bts_read_record(struct task_struct *child, size_t index,
  607. struct bts_struct __user *out)
  608. {
  609. struct bts_context *context;
  610. const struct bts_trace *trace;
  611. struct bts_struct bts;
  612. const unsigned char *at;
  613. int error;
  614. context = child->bts;
  615. if (!context)
  616. return -ESRCH;
  617. trace = ds_read_bts(context->tracer);
  618. if (!trace)
  619. return -ESRCH;
  620. at = trace->ds.top - ((index + 1) * trace->ds.size);
  621. if ((void *)at < trace->ds.begin)
  622. at += (trace->ds.n * trace->ds.size);
  623. if (!trace->read)
  624. return -EOPNOTSUPP;
  625. error = trace->read(context->tracer, at, &bts);
  626. if (error < 0)
  627. return error;
  628. if (copy_to_user(out, &bts, sizeof(bts)))
  629. return -EFAULT;
  630. return sizeof(bts);
  631. }
  632. static int ptrace_bts_drain(struct task_struct *child,
  633. long size,
  634. struct bts_struct __user *out)
  635. {
  636. struct bts_context *context;
  637. const struct bts_trace *trace;
  638. const unsigned char *at;
  639. int error, drained = 0;
  640. context = child->bts;
  641. if (!context)
  642. return -ESRCH;
  643. trace = ds_read_bts(context->tracer);
  644. if (!trace)
  645. return -ESRCH;
  646. if (!trace->read)
  647. return -EOPNOTSUPP;
  648. if (size < (trace->ds.top - trace->ds.begin))
  649. return -EIO;
  650. for (at = trace->ds.begin; (void *)at < trace->ds.top;
  651. out++, drained++, at += trace->ds.size) {
  652. struct bts_struct bts;
  653. error = trace->read(context->tracer, at, &bts);
  654. if (error < 0)
  655. return error;
  656. if (copy_to_user(out, &bts, sizeof(bts)))
  657. return -EFAULT;
  658. }
  659. memset(trace->ds.begin, 0, trace->ds.n * trace->ds.size);
  660. error = ds_reset_bts(context->tracer);
  661. if (error < 0)
  662. return error;
  663. return drained;
  664. }
  665. static int ptrace_bts_config(struct task_struct *child,
  666. long cfg_size,
  667. const struct ptrace_bts_config __user *ucfg)
  668. {
  669. struct bts_context *context;
  670. struct ptrace_bts_config cfg;
  671. unsigned int flags = 0;
  672. if (cfg_size < sizeof(cfg))
  673. return -EIO;
  674. if (copy_from_user(&cfg, ucfg, sizeof(cfg)))
  675. return -EFAULT;
  676. context = child->bts;
  677. if (!context)
  678. context = alloc_bts_context(child);
  679. if (!context)
  680. return -ENOMEM;
  681. if (cfg.flags & PTRACE_BTS_O_SIGNAL) {
  682. if (!cfg.signal)
  683. return -EINVAL;
  684. return -EOPNOTSUPP;
  685. context->bts_ovfl_signal = cfg.signal;
  686. }
  687. ds_release_bts(context->tracer);
  688. context->tracer = NULL;
  689. if ((cfg.flags & PTRACE_BTS_O_ALLOC) && (cfg.size != context->size)) {
  690. int err;
  691. free_bts_buffer(context);
  692. if (!cfg.size)
  693. return 0;
  694. err = alloc_bts_buffer(context, cfg.size);
  695. if (err < 0)
  696. return err;
  697. }
  698. if (cfg.flags & PTRACE_BTS_O_TRACE)
  699. flags |= BTS_USER;
  700. if (cfg.flags & PTRACE_BTS_O_SCHED)
  701. flags |= BTS_TIMESTAMPS;
  702. context->tracer =
  703. ds_request_bts_task(child, context->buffer, context->size,
  704. NULL, (size_t)-1, flags);
  705. if (unlikely(IS_ERR(context->tracer))) {
  706. int error = PTR_ERR(context->tracer);
  707. free_bts_buffer(context);
  708. context->tracer = NULL;
  709. return error;
  710. }
  711. return sizeof(cfg);
  712. }
  713. static int ptrace_bts_status(struct task_struct *child,
  714. long cfg_size,
  715. struct ptrace_bts_config __user *ucfg)
  716. {
  717. struct bts_context *context;
  718. const struct bts_trace *trace;
  719. struct ptrace_bts_config cfg;
  720. context = child->bts;
  721. if (!context)
  722. return -ESRCH;
  723. if (cfg_size < sizeof(cfg))
  724. return -EIO;
  725. trace = ds_read_bts(context->tracer);
  726. if (!trace)
  727. return -ESRCH;
  728. memset(&cfg, 0, sizeof(cfg));
  729. cfg.size = trace->ds.end - trace->ds.begin;
  730. cfg.signal = context->bts_ovfl_signal;
  731. cfg.bts_size = sizeof(struct bts_struct);
  732. if (cfg.signal)
  733. cfg.flags |= PTRACE_BTS_O_SIGNAL;
  734. if (trace->ds.flags & BTS_USER)
  735. cfg.flags |= PTRACE_BTS_O_TRACE;
  736. if (trace->ds.flags & BTS_TIMESTAMPS)
  737. cfg.flags |= PTRACE_BTS_O_SCHED;
  738. if (copy_to_user(ucfg, &cfg, sizeof(cfg)))
  739. return -EFAULT;
  740. return sizeof(cfg);
  741. }
  742. static int ptrace_bts_clear(struct task_struct *child)
  743. {
  744. struct bts_context *context;
  745. const struct bts_trace *trace;
  746. context = child->bts;
  747. if (!context)
  748. return -ESRCH;
  749. trace = ds_read_bts(context->tracer);
  750. if (!trace)
  751. return -ESRCH;
  752. memset(trace->ds.begin, 0, trace->ds.n * trace->ds.size);
  753. return ds_reset_bts(context->tracer);
  754. }
  755. static int ptrace_bts_size(struct task_struct *child)
  756. {
  757. struct bts_context *context;
  758. const struct bts_trace *trace;
  759. context = child->bts;
  760. if (!context)
  761. return -ESRCH;
  762. trace = ds_read_bts(context->tracer);
  763. if (!trace)
  764. return -ESRCH;
  765. return (trace->ds.top - trace->ds.begin) / trace->ds.size;
  766. }
  767. /*
  768. * Called from __ptrace_unlink() after the child has been moved back
  769. * to its original parent.
  770. */
  771. void ptrace_bts_untrace(struct task_struct *child)
  772. {
  773. if (unlikely(child->bts)) {
  774. free_bts_context(child->bts);
  775. child->bts = NULL;
  776. }
  777. }
  778. #endif /* CONFIG_X86_PTRACE_BTS */
  /*
   * Called by kernel/ptrace.c when detaching.
   *
   * Makes sure the single step bit is not set and, where the
   * architecture defines TIF_SYSCALL_EMU, clears that flag too.
   */
  void ptrace_disable(struct task_struct *child)
  {
      user_disable_single_step(child);

  #if defined(TIF_SYSCALL_EMU)
      clear_tsk_thread_flag(child, TIF_SYSCALL_EMU);
  #endif
  }
  #if defined(CONFIG_X86_32) || defined(CONFIG_IA32_EMULATION)
  /* Forward declaration only; the view is initialized further down. */
  static const struct user_regset_view user_x86_32_view;
  #endif
  794. long arch_ptrace(struct task_struct *child, long request, long addr, long data)
  795. {
  796. int ret;
  797. unsigned long __user *datap = (unsigned long __user *)data;
  798. switch (request) {
  799. /* read the word at location addr in the USER area. */
  800. case PTRACE_PEEKUSR: {
  801. unsigned long tmp;
  802. ret = -EIO;
  803. if ((addr & (sizeof(data) - 1)) || addr < 0 ||
  804. addr >= sizeof(struct user))
  805. break;
  806. tmp = 0; /* Default return condition */
  807. if (addr < sizeof(struct user_regs_struct))
  808. tmp = getreg(child, addr);
  809. else if (addr >= offsetof(struct user, u_debugreg[0]) &&
  810. addr <= offsetof(struct user, u_debugreg[7])) {
  811. addr -= offsetof(struct user, u_debugreg[0]);
  812. tmp = ptrace_get_debugreg(child, addr / sizeof(data));
  813. }
  814. ret = put_user(tmp, datap);
  815. break;
  816. }
  817. case PTRACE_POKEUSR: /* write the word at location addr in the USER area */
  818. ret = -EIO;
  819. if ((addr & (sizeof(data) - 1)) || addr < 0 ||
  820. addr >= sizeof(struct user))
  821. break;
  822. if (addr < sizeof(struct user_regs_struct))
  823. ret = putreg(child, addr, data);
  824. else if (addr >= offsetof(struct user, u_debugreg[0]) &&
  825. addr <= offsetof(struct user, u_debugreg[7])) {
  826. addr -= offsetof(struct user, u_debugreg[0]);
  827. ret = ptrace_set_debugreg(child,
  828. addr / sizeof(data), data);
  829. }
  830. break;
  831. case PTRACE_GETREGS: /* Get all gp regs from the child. */
  832. return copy_regset_to_user(child,
  833. task_user_regset_view(current),
  834. REGSET_GENERAL,
  835. 0, sizeof(struct user_regs_struct),
  836. datap);
  837. case PTRACE_SETREGS: /* Set all gp regs in the child. */
  838. return copy_regset_from_user(child,
  839. task_user_regset_view(current),
  840. REGSET_GENERAL,
  841. 0, sizeof(struct user_regs_struct),
  842. datap);
  843. case PTRACE_GETFPREGS: /* Get the child FPU state. */
  844. return copy_regset_to_user(child,
  845. task_user_regset_view(current),
  846. REGSET_FP,
  847. 0, sizeof(struct user_i387_struct),
  848. datap);
  849. case PTRACE_SETFPREGS: /* Set the child FPU state. */
  850. return copy_regset_from_user(child,
  851. task_user_regset_view(current),
  852. REGSET_FP,
  853. 0, sizeof(struct user_i387_struct),
  854. datap);
  855. #ifdef CONFIG_X86_32
  856. case PTRACE_GETFPXREGS: /* Get the child extended FPU state. */
  857. return copy_regset_to_user(child, &user_x86_32_view,
  858. REGSET_XFP,
  859. 0, sizeof(struct user_fxsr_struct),
  860. datap) ? -EIO : 0;
  861. case PTRACE_SETFPXREGS: /* Set the child extended FPU state. */
  862. return copy_regset_from_user(child, &user_x86_32_view,
  863. REGSET_XFP,
  864. 0, sizeof(struct user_fxsr_struct),
  865. datap) ? -EIO : 0;
  866. #endif
  867. #if defined CONFIG_X86_32 || defined CONFIG_IA32_EMULATION
  868. case PTRACE_GET_THREAD_AREA:
  869. if (addr < 0)
  870. return -EIO;
  871. ret = do_get_thread_area(child, addr,
  872. (struct user_desc __user *) data);
  873. break;
  874. case PTRACE_SET_THREAD_AREA:
  875. if (addr < 0)
  876. return -EIO;
  877. ret = do_set_thread_area(child, addr,
  878. (struct user_desc __user *) data, 0);
  879. break;
  880. #endif
  881. #ifdef CONFIG_X86_64
  882. /* normal 64bit interface to access TLS data.
  883. Works just like arch_prctl, except that the arguments
  884. are reversed. */
  885. case PTRACE_ARCH_PRCTL:
  886. ret = do_arch_prctl(child, data, addr);
  887. break;
  888. #endif
  889. /*
  890. * These bits need more cooking - not enabled yet:
  891. */
  892. #ifdef CONFIG_X86_PTRACE_BTS
  893. case PTRACE_BTS_CONFIG:
  894. ret = ptrace_bts_config
  895. (child, data, (struct ptrace_bts_config __user *)addr);
  896. break;
  897. case PTRACE_BTS_STATUS:
  898. ret = ptrace_bts_status
  899. (child, data, (struct ptrace_bts_config __user *)addr);
  900. break;
  901. case PTRACE_BTS_SIZE:
  902. ret = ptrace_bts_size(child);
  903. break;
  904. case PTRACE_BTS_GET:
  905. ret = ptrace_bts_read_record
  906. (child, data, (struct bts_struct __user *) addr);
  907. break;
  908. case PTRACE_BTS_CLEAR:
  909. ret = ptrace_bts_clear(child);
  910. break;
  911. case PTRACE_BTS_DRAIN:
  912. ret = ptrace_bts_drain
  913. (child, data, (struct bts_struct __user *) addr);
  914. break;
  915. #endif /* CONFIG_X86_PTRACE_BTS */
  916. default:
  917. ret = ptrace_request(child, request, addr, data);
  918. break;
  919. }
  920. return ret;
  921. }
  922. #ifdef CONFIG_IA32_EMULATION
  923. #include <linux/compat.h>
  924. #include <linux/syscalls.h>
  925. #include <asm/ia32.h>
  926. #include <asm/user32.h>
  927. #define R32(l,q) \
  928. case offsetof(struct user32, regs.l): \
  929. regs->q = value; break
  930. #define SEG32(rs) \
  931. case offsetof(struct user32, regs.rs): \
  932. return set_segment_reg(child, \
  933. offsetof(struct user_regs_struct, rs), \
  934. value); \
  935. break
  936. static int putreg32(struct task_struct *child, unsigned regno, u32 value)
  937. {
  938. struct pt_regs *regs = task_pt_regs(child);
  939. switch (regno) {
  940. SEG32(cs);
  941. SEG32(ds);
  942. SEG32(es);
  943. SEG32(fs);
  944. SEG32(gs);
  945. SEG32(ss);
  946. R32(ebx, bx);
  947. R32(ecx, cx);
  948. R32(edx, dx);
  949. R32(edi, di);
  950. R32(esi, si);
  951. R32(ebp, bp);
  952. R32(eax, ax);
  953. R32(eip, ip);
  954. R32(esp, sp);
  955. case offsetof(struct user32, regs.orig_eax):
  956. /*
  957. * Sign-extend the value so that orig_eax = -1
  958. * causes (long)orig_ax < 0 tests to fire correctly.
  959. */
  960. regs->orig_ax = (long) (s32) value;
  961. break;
  962. case offsetof(struct user32, regs.eflags):
  963. return set_flags(child, value);
  964. case offsetof(struct user32, u_debugreg[0]) ...
  965. offsetof(struct user32, u_debugreg[7]):
  966. regno -= offsetof(struct user32, u_debugreg[0]);
  967. return ptrace_set_debugreg(child, regno / 4, value);
  968. default:
  969. if (regno > sizeof(struct user32) || (regno & 3))
  970. return -EIO;
  971. /*
  972. * Other dummy fields in the virtual user structure
  973. * are ignored
  974. */
  975. break;
  976. }
  977. return 0;
  978. }
  979. #undef R32
  980. #undef SEG32
  981. #define R32(l,q) \
  982. case offsetof(struct user32, regs.l): \
  983. *val = regs->q; break
  984. #define SEG32(rs) \
  985. case offsetof(struct user32, regs.rs): \
  986. *val = get_segment_reg(child, \
  987. offsetof(struct user_regs_struct, rs)); \
  988. break
  989. static int getreg32(struct task_struct *child, unsigned regno, u32 *val)
  990. {
  991. struct pt_regs *regs = task_pt_regs(child);
  992. switch (regno) {
  993. SEG32(ds);
  994. SEG32(es);
  995. SEG32(fs);
  996. SEG32(gs);
  997. R32(cs, cs);
  998. R32(ss, ss);
  999. R32(ebx, bx);
  1000. R32(ecx, cx);
  1001. R32(edx, dx);
  1002. R32(edi, di);
  1003. R32(esi, si);
  1004. R32(ebp, bp);
  1005. R32(eax, ax);
  1006. R32(orig_eax, orig_ax);
  1007. R32(eip, ip);
  1008. R32(esp, sp);
  1009. case offsetof(struct user32, regs.eflags):
  1010. *val = get_flags(child);
  1011. break;
  1012. case offsetof(struct user32, u_debugreg[0]) ...
  1013. offsetof(struct user32, u_debugreg[7]):
  1014. regno -= offsetof(struct user32, u_debugreg[0]);
  1015. *val = ptrace_get_debugreg(child, regno / 4);
  1016. break;
  1017. default:
  1018. if (regno > sizeof(struct user32) || (regno & 3))
  1019. return -EIO;
  1020. /*
  1021. * Other dummy fields in the virtual user structure
  1022. * are ignored
  1023. */
  1024. *val = 0;
  1025. break;
  1026. }
  1027. return 0;
  1028. }
  1029. #undef R32
  1030. #undef SEG32
  1031. static int genregs32_get(struct task_struct *target,
  1032. const struct user_regset *regset,
  1033. unsigned int pos, unsigned int count,
  1034. void *kbuf, void __user *ubuf)
  1035. {
  1036. if (kbuf) {
  1037. compat_ulong_t *k = kbuf;
  1038. while (count > 0) {
  1039. getreg32(target, pos, k++);
  1040. count -= sizeof(*k);
  1041. pos += sizeof(*k);
  1042. }
  1043. } else {
  1044. compat_ulong_t __user *u = ubuf;
  1045. while (count > 0) {
  1046. compat_ulong_t word;
  1047. getreg32(target, pos, &word);
  1048. if (__put_user(word, u++))
  1049. return -EFAULT;
  1050. count -= sizeof(*u);
  1051. pos += sizeof(*u);
  1052. }
  1053. }
  1054. return 0;
  1055. }
  1056. static int genregs32_set(struct task_struct *target,
  1057. const struct user_regset *regset,
  1058. unsigned int pos, unsigned int count,
  1059. const void *kbuf, const void __user *ubuf)
  1060. {
  1061. int ret = 0;
  1062. if (kbuf) {
  1063. const compat_ulong_t *k = kbuf;
  1064. while (count > 0 && !ret) {
  1065. ret = putreg32(target, pos, *k++);
  1066. count -= sizeof(*k);
  1067. pos += sizeof(*k);
  1068. }
  1069. } else {
  1070. const compat_ulong_t __user *u = ubuf;
  1071. while (count > 0 && !ret) {
  1072. compat_ulong_t word;
  1073. ret = __get_user(word, u++);
  1074. if (ret)
  1075. break;
  1076. ret = putreg32(target, pos, word);
  1077. count -= sizeof(*u);
  1078. pos += sizeof(*u);
  1079. }
  1080. }
  1081. return ret;
  1082. }
  1083. long compat_arch_ptrace(struct task_struct *child, compat_long_t request,
  1084. compat_ulong_t caddr, compat_ulong_t cdata)
  1085. {
  1086. unsigned long addr = caddr;
  1087. unsigned long data = cdata;
  1088. void __user *datap = compat_ptr(data);
  1089. int ret;
  1090. __u32 val;
  1091. switch (request) {
  1092. case PTRACE_PEEKUSR:
  1093. ret = getreg32(child, addr, &val);
  1094. if (ret == 0)
  1095. ret = put_user(val, (__u32 __user *)datap);
  1096. break;
  1097. case PTRACE_POKEUSR:
  1098. ret = putreg32(child, addr, data);
  1099. break;
  1100. case PTRACE_GETREGS: /* Get all gp regs from the child. */
  1101. return copy_regset_to_user(child, &user_x86_32_view,
  1102. REGSET_GENERAL,
  1103. 0, sizeof(struct user_regs_struct32),
  1104. datap);
  1105. case PTRACE_SETREGS: /* Set all gp regs in the child. */
  1106. return copy_regset_from_user(child, &user_x86_32_view,
  1107. REGSET_GENERAL, 0,
  1108. sizeof(struct user_regs_struct32),
  1109. datap);
  1110. case PTRACE_GETFPREGS: /* Get the child FPU state. */
  1111. return copy_regset_to_user(child, &user_x86_32_view,
  1112. REGSET_FP, 0,
  1113. sizeof(struct user_i387_ia32_struct),
  1114. datap);
  1115. case PTRACE_SETFPREGS: /* Set the child FPU state. */
  1116. return copy_regset_from_user(
  1117. child, &user_x86_32_view, REGSET_FP,
  1118. 0, sizeof(struct user_i387_ia32_struct), datap);
  1119. case PTRACE_GETFPXREGS: /* Get the child extended FPU state. */
  1120. return copy_regset_to_user(child, &user_x86_32_view,
  1121. REGSET_XFP, 0,
  1122. sizeof(struct user32_fxsr_struct),
  1123. datap);
  1124. case PTRACE_SETFPXREGS: /* Set the child extended FPU state. */
  1125. return copy_regset_from_user(child, &user_x86_32_view,
  1126. REGSET_XFP, 0,
  1127. sizeof(struct user32_fxsr_struct),
  1128. datap);
  1129. case PTRACE_GET_THREAD_AREA:
  1130. case PTRACE_SET_THREAD_AREA:
  1131. #ifdef CONFIG_X86_PTRACE_BTS
  1132. case PTRACE_BTS_CONFIG:
  1133. case PTRACE_BTS_STATUS:
  1134. case PTRACE_BTS_SIZE:
  1135. case PTRACE_BTS_GET:
  1136. case PTRACE_BTS_CLEAR:
  1137. case PTRACE_BTS_DRAIN:
  1138. #endif /* CONFIG_X86_PTRACE_BTS */
  1139. return arch_ptrace(child, request, addr, data);
  1140. default:
  1141. return compat_ptrace_request(child, request, addr, data);
  1142. }
  1143. return ret;
  1144. }
  1145. #endif /* CONFIG_IA32_EMULATION */
  1146. #ifdef CONFIG_X86_64
  1147. static const struct user_regset x86_64_regsets[] = {
  1148. [REGSET_GENERAL] = {
  1149. .core_note_type = NT_PRSTATUS,
  1150. .n = sizeof(struct user_regs_struct) / sizeof(long),
  1151. .size = sizeof(long), .align = sizeof(long),
  1152. .get = genregs_get, .set = genregs_set
  1153. },
  1154. [REGSET_FP] = {
  1155. .core_note_type = NT_PRFPREG,
  1156. .n = sizeof(struct user_i387_struct) / sizeof(long),
  1157. .size = sizeof(long), .align = sizeof(long),
  1158. .active = xfpregs_active, .get = xfpregs_get, .set = xfpregs_set
  1159. },
  1160. [REGSET_IOPERM64] = {
  1161. .core_note_type = NT_386_IOPERM,
  1162. .n = IO_BITMAP_LONGS,
  1163. .size = sizeof(long), .align = sizeof(long),
  1164. .active = ioperm_active, .get = ioperm_get
  1165. },
  1166. };
  1167. static const struct user_regset_view user_x86_64_view = {
  1168. .name = "x86_64", .e_machine = EM_X86_64,
  1169. .regsets = x86_64_regsets, .n = ARRAY_SIZE(x86_64_regsets)
  1170. };
  1171. #else /* CONFIG_X86_32 */
  /*
   * On this (non-64-bit) branch the "32" names used by the x86_32 regset
   * table below are simply aliases for the native types and handlers.
   */
  #define user_regs_struct32	user_regs_struct
  #define genregs32_get		genregs_get
  #define genregs32_set		genregs_set
  #define user_i387_ia32_struct	user_i387_struct
  #define user32_fxsr_struct	user_fxsr_struct
  1177. #endif /* CONFIG_X86_64 */
  1178. #if defined CONFIG_X86_32 || defined CONFIG_IA32_EMULATION
  1179. static const struct user_regset x86_32_regsets[] = {
  1180. [REGSET_GENERAL] = {
  1181. .core_note_type = NT_PRSTATUS,
  1182. .n = sizeof(struct user_regs_struct32) / sizeof(u32),
  1183. .size = sizeof(u32), .align = sizeof(u32),
  1184. .get = genregs32_get, .set = genregs32_set
  1185. },
  1186. [REGSET_FP] = {
  1187. .core_note_type = NT_PRFPREG,
  1188. .n = sizeof(struct user_i387_ia32_struct) / sizeof(u32),
  1189. .size = sizeof(u32), .align = sizeof(u32),
  1190. .active = fpregs_active, .get = fpregs_get, .set = fpregs_set
  1191. },
  1192. [REGSET_XFP] = {
  1193. .core_note_type = NT_PRXFPREG,
  1194. .n = sizeof(struct user32_fxsr_struct) / sizeof(u32),
  1195. .size = sizeof(u32), .align = sizeof(u32),
  1196. .active = xfpregs_active, .get = xfpregs_get, .set = xfpregs_set
  1197. },
  1198. [REGSET_TLS] = {
  1199. .core_note_type = NT_386_TLS,
  1200. .n = GDT_ENTRY_TLS_ENTRIES, .bias = GDT_ENTRY_TLS_MIN,
  1201. .size = sizeof(struct user_desc),
  1202. .align = sizeof(struct user_desc),
  1203. .active = regset_tls_active,
  1204. .get = regset_tls_get, .set = regset_tls_set
  1205. },
  1206. [REGSET_IOPERM32] = {
  1207. .core_note_type = NT_386_IOPERM,
  1208. .n = IO_BITMAP_BYTES / sizeof(u32),
  1209. .size = sizeof(u32), .align = sizeof(u32),
  1210. .active = ioperm_active, .get = ioperm_get
  1211. },
  1212. };
  1213. static const struct user_regset_view user_x86_32_view = {
  1214. .name = "i386", .e_machine = EM_386,
  1215. .regsets = x86_32_regsets, .n = ARRAY_SIZE(x86_32_regsets)
  1216. };
  1217. #endif
  1218. const struct user_regset_view *task_user_regset_view(struct task_struct *task)
  1219. {
  1220. #ifdef CONFIG_IA32_EMULATION
  1221. if (test_tsk_thread_flag(task, TIF_IA32))
  1222. #endif
  1223. #if defined CONFIG_X86_32 || defined CONFIG_IA32_EMULATION
  1224. return &user_x86_32_view;
  1225. #endif
  1226. #ifdef CONFIG_X86_64
  1227. return &user_x86_64_view;
  1228. #endif
  1229. }
  1230. void send_sigtrap(struct task_struct *tsk, struct pt_regs *regs,
  1231. int error_code, int si_code)
  1232. {
  1233. struct siginfo info;
  1234. tsk->thread.trap_no = 1;
  1235. tsk->thread.error_code = error_code;
  1236. memset(&info, 0, sizeof(info));
  1237. info.si_signo = SIGTRAP;
  1238. info.si_code = si_code;
  1239. /* User-mode ip? */
  1240. info.si_addr = user_mode_vm(regs) ? (void __user *) regs->ip : NULL;
  1241. /* Send us the fake SIGTRAP */
  1242. force_sig_info(SIGTRAP, &info, tsk);
  1243. }
  /*
   * IS_IA32: constant 1 on 32-bit kernels, is_compat_task() on kernels
   * built with IA32 emulation, constant 0 otherwise.
   */
  #if defined(CONFIG_X86_32)
  # define IS_IA32	1
  #elif defined(CONFIG_IA32_EMULATION)
  # define IS_IA32	is_compat_task()
  #else
  # define IS_IA32	0
  #endif
  1251. /*
  1252. * We must return the syscall number to actually look up in the table.
  1253. * This can be -1L to skip running any syscall at all.
  1254. */
  1255. asmregparm long syscall_trace_enter(struct pt_regs *regs)
  1256. {
  1257. long ret = 0;
  1258. /*
  1259. * If we stepped into a sysenter/syscall insn, it trapped in
  1260. * kernel mode; do_debug() cleared TF and set TIF_SINGLESTEP.
  1261. * If user-mode had set TF itself, then it's still clear from
  1262. * do_debug() and we need to set it again to restore the user
  1263. * state. If we entered on the slow path, TF was already set.
  1264. */
  1265. if (test_thread_flag(TIF_SINGLESTEP))
  1266. regs->flags |= X86_EFLAGS_TF;
  1267. /* do the secure computing check first */
  1268. secure_computing(regs->orig_ax);
  1269. if (unlikely(test_thread_flag(TIF_SYSCALL_EMU)))
  1270. ret = -1L;
  1271. if ((ret || test_thread_flag(TIF_SYSCALL_TRACE)) &&
  1272. tracehook_report_syscall_entry(regs))
  1273. ret = -1L;
  1274. if (unlikely(test_thread_flag(TIF_SYSCALL_FTRACE)))
  1275. ftrace_syscall_enter(regs);
  1276. if (unlikely(current->audit_context)) {
  1277. if (IS_IA32)
  1278. audit_syscall_entry(AUDIT_ARCH_I386,
  1279. regs->orig_ax,
  1280. regs->bx, regs->cx,
  1281. regs->dx, regs->si);
  1282. #ifdef CONFIG_X86_64
  1283. else
  1284. audit_syscall_entry(AUDIT_ARCH_X86_64,
  1285. regs->orig_ax,
  1286. regs->di, regs->si,
  1287. regs->dx, regs->r10);
  1288. #endif
  1289. }
  1290. return ret ?: regs->orig_ax;
  1291. }
  1292. asmregparm void syscall_trace_leave(struct pt_regs *regs)
  1293. {
  1294. if (unlikely(current->audit_context))
  1295. audit_syscall_exit(AUDITSC_RESULT(regs->ax), regs->ax);
  1296. if (unlikely(test_thread_flag(TIF_SYSCALL_FTRACE)))
  1297. ftrace_syscall_exit(regs);
  1298. if (test_thread_flag(TIF_SYSCALL_TRACE))
  1299. tracehook_report_syscall_exit(regs, 0);
  1300. /*
  1301. * If TIF_SYSCALL_EMU is set, we only get here because of
  1302. * TIF_SINGLESTEP (i.e. this is PTRACE_SYSEMU_SINGLESTEP).
  1303. * We already reported this syscall instruction in
  1304. * syscall_trace_enter(), so don't do any more now.
  1305. */
  1306. if (unlikely(test_thread_flag(TIF_SYSCALL_EMU)))
  1307. return;
  1308. /*
  1309. * If we are single-stepping, synthesize a trap to follow the
  1310. * system call instruction.
  1311. */
  1312. if (test_thread_flag(TIF_SINGLESTEP) &&
  1313. tracehook_consider_fatal_signal(current, SIGTRAP))
  1314. send_sigtrap(current, regs, 0, TRAP_BRKPT);
  1315. }