ia32entry.S 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498
  1. /*
  2. * Compatibility mode system call entry point for x86-64.
  3. *
  4. * Copyright 2000-2002 Andi Kleen, SuSE Labs.
  5. */
  6. #include <asm/dwarf2.h>
  7. #include <asm/calling.h>
  8. #include <asm/asm-offsets.h>
  9. #include <asm/current.h>
  10. #include <asm/errno.h>
  11. #include <asm/ia32_unistd.h>
  12. #include <asm/thread_info.h>
  13. #include <asm/segment.h>
  14. #include <asm/irqflags.h>
  15. #include <asm/asm.h>
  16. #include <asm/smap.h>
  17. #include <linux/linkage.h>
  18. #include <linux/err.h>
  19. /* Avoid __ASSEMBLER__'ifying <linux/audit.h> just for this. */
  20. #include <linux/elf-em.h>
  /*
   * Audit architecture tag handed to __audit_syscall_entry as its first
   * argument. __AUDIT_ARCH_LE is defined one line later; that works because
   * the preprocessor only expands AUDIT_ARCH_I386 at its point of use.
   */
  21. #define AUDIT_ARCH_I386 (EM_386|__AUDIT_ARCH_LE)
  22. #define __AUDIT_ARCH_LE 0x40000000
  /*
   * The sysexit_audit and sysretl_audit labels are only emitted under
   * CONFIG_AUDITSYSCALL. Without it, the fast-path exit checks that branch
   * to them are redirected to the generic ia32_ret_from_sys_call path.
   */
  23. #ifndef CONFIG_AUDITSYSCALL
  24. #define sysexit_audit ia32_ret_from_sys_call
  25. #define sysretl_audit ia32_ret_from_sys_call
  26. #endif
  27. .section .entry.text, "ax"
  /*
   * IA32_ARG_FIXUP - move the 32-bit syscall arguments into the registers
   * used for the call through ia32_sys_call_table.
   *
   * On entry the arguments sit in %ebx, %ecx, %edx, %esi, %edi, %ebp
   * (arg1..arg6). After the macro they are in %edi, %esi, %edx, %ecx,
   * %r8d, %r9d. Every move is a 32-bit operation, so the upper halves of
   * the 64-bit registers end up cleared.
   *
   * noebp: when non-zero, %r9d is left alone instead of being loaded from
   *        %ebp. The SYSCALL entry uses this: there arg6 has already been
   *        read into %r9d and %ebp carries arg2.
   */
  28. .macro IA32_ARG_FIXUP noebp=0
  29. movl %edi,%r8d /* arg5; saved before %edi is overwritten below */
  30. .if \noebp
  31. .else
  32. movl %ebp,%r9d /* arg6 */
  33. .endif
  34. xchg %ecx,%esi /* arg2 -> %esi, arg4 -> %ecx */
  35. movl %ebx,%edi /* arg1 */
  36. movl %edx,%edx /* arg3 stays in place; zero extension */
  37. .endm
  38. /* clobbers %eax */
  /*
   * CLEAR_RREGS - store zero into the saved R8, R10 and R11 slots of the
   * register frame, and store register _r9 into the R9 slot.
   *
   * offset: displacement added to each slot offset (relative to %rsp).
   * _r9:    name (without the % sign) of the register written to the R9
   *         slot. The default, rax, has just been zeroed, so by default
   *         the R9 slot is cleared too.
   */
  39. .macro CLEAR_RREGS offset=0, _r9=rax
  40. xorl %eax,%eax /* %rax = 0, the value stored below */
  41. movq %rax,\offset+R11(%rsp)
  42. movq %rax,\offset+R10(%rsp)
  43. movq %\_r9,\offset+R9(%rsp)
  44. movq %rax,\offset+R8(%rsp)
  45. .endm
  46. /*
  47. * Reload arg registers from stack in case ptrace changed them.
  48. * We don't reload %eax because syscall_trace_enter() returned
  49. * the %rax value we should see. Instead, we just truncate that
  50. * value to 32 bits again as we did on entry from user mode.
  51. * If it's a new value set by user_regset during entry tracing,
  52. * this matches the normal truncation of the user-mode value.
  53. * If it's -1 to make us punt the syscall, then (u32)-1 is still
  54. * an appropriately invalid value.
  55. */
  /*
   * offset: displacement added to each stack slot offset below.
   * _r9:    when non-zero, %r9d is reloaded as well (from offset+16).
   *
   * All loads are 32-bit, so the reloaded registers are zero-extended.
   *
   * NOTE(review): the literal offsets 16/40/48/56/64 presumably match the
   * R9/RCX/RDX/RSI/RDI slots of the frame layout in <asm/calling.h>;
   * confirm against that header.
   */
  56. .macro LOAD_ARGS32 offset, _r9=0
  57. .if \_r9
  58. movl \offset+16(%rsp),%r9d
  59. .endif
  60. movl \offset+40(%rsp),%ecx
  61. movl \offset+48(%rsp),%edx
  62. movl \offset+56(%rsp),%esi
  63. movl \offset+64(%rsp),%edi
  64. movl %eax,%eax /* zero extension */
  65. .endm
  /*
   * CFI_STARTPROC32 - open a CFI procedure (forwarding the optional "simple"
   * argument to CFI_STARTPROC) and mark r8-r15 as undefined for the unwinder.
   * NOTE(review): presumably because the interrupted 32-bit user code has no
   * r8-r15 state worth recovering - confirm.
   */
  66. .macro CFI_STARTPROC32 simple
  67. CFI_STARTPROC \simple
  68. CFI_UNDEFINED r8
  69. CFI_UNDEFINED r9
  70. CFI_UNDEFINED r10
  71. CFI_UNDEFINED r11
  72. CFI_UNDEFINED r12
  73. CFI_UNDEFINED r13
  74. CFI_UNDEFINED r14
  75. CFI_UNDEFINED r15
  76. .endm
  77. #ifdef CONFIG_PARAVIRT
  /*
   * Native (bare hardware) return-to-user sequences, built only for paravirt
   * kernels. NOTE(review): presumably these are what USERGS_SYSRET32 and
   * ENABLE_INTERRUPTS_SYSEXIT32 resolve to when not running under a
   * hypervisor - confirm in the paravirt headers.
   */
  /* swap GS base, then return to 32-bit user mode with SYSRET */
  78. ENTRY(native_usergs_sysret32)
  79. swapgs
  80. sysretl
  81. ENDPROC(native_usergs_sysret32)
  /* swap GS base, re-enable interrupts, then return with SYSEXIT */
  82. ENTRY(native_irq_enable_sysexit)
  83. swapgs
  84. sti
  85. sysexit
  86. ENDPROC(native_irq_enable_sysexit)
  87. #endif
  88. /*
  89. * 32bit SYSENTER instruction entry.
  90. *
  91. * Arguments:
  92. * %eax System call number.
  93. * %ebx Arg1
  94. * %ecx Arg2
  95. * %edx Arg3
  96. * %esi Arg4
  97. * %edi Arg5
  98. * %ebp user stack
  99. * 0(%ebp) Arg6
  100. *
  101. * Interrupts off.
  102. *
  103. * This is purely a fast path. For anything complicated we use the int 0x80
  104. * path below. Set up a complete hardware stack frame to share code
  105. * with the int 0x80 path.
  106. */
  /*
   * Flow of the fast path:
   *   1. switch to the kernel stack and push SS, user stack pointer, flags,
   *      CS, return address and syscall number by hand;
   *   2. fetch arg6 from the user stack;
   *   3. divert to sysenter_tracesys if any syscall-entry work flag is set,
   *      or to ia32_badsys if the syscall number is out of range;
   *   4. call the handler through ia32_sys_call_table;
   *   5. if no exit work is pending, return to user mode via SYSEXIT.
   */
  107. ENTRY(ia32_sysenter_target)
  108. CFI_STARTPROC32 simple
  109. CFI_SIGNAL_FRAME
  110. CFI_DEF_CFA rsp,0
  111. CFI_REGISTER rsp,rbp
  112. SWAPGS_UNSAFE_STACK
  /* switch to the kernel stack recorded in the per-CPU kernel_stack variable */
  113. movq PER_CPU_VAR(kernel_stack), %rsp
  114. addq $(KERNEL_STACK_OFFSET),%rsp
  115. /*
  116. * No need to follow this irqs on/off section: the syscall
  117. * disabled irqs, here we enable it straight after entry:
  118. */
  119. ENABLE_INTERRUPTS(CLBR_NONE)
  120. movl %ebp,%ebp /* zero extension */
  /* build the frame by hand: SS, user stack pointer, flags, CS, return address */
  121. pushq_cfi $__USER32_DS
  122. /*CFI_REL_OFFSET ss,0*/
  123. pushq_cfi %rbp /* user stack pointer (passed in %ebp) */
  124. CFI_REL_OFFSET rsp,0
  125. pushfq_cfi
  126. /*CFI_REL_OFFSET rflags,0*/
  /* user return address comes from thread_info (sysenter_return field) */
  127. movl TI_sysenter_return+THREAD_INFO(%rsp,3*8-KERNEL_STACK_OFFSET),%r10d
  128. CFI_REGISTER rip,r10
  129. pushq_cfi $__USER32_CS
  130. /*CFI_REL_OFFSET cs,0*/
  131. movl %eax, %eax /* zero-extend the syscall number */
  132. pushq_cfi %r10 /* user return address */
  133. CFI_REL_OFFSET rip,0
  134. pushq_cfi %rax /* syscall number */
  135. cld
  /* NOTE(review): SAVE_ARGS is defined outside this file; it presumably
     stores the argument registers below the frame built above - confirm. */
  136. SAVE_ARGS 0,1,0
  137. /* no need to do an access_ok check here because rbp has been
  138. 32bit zero extended */
  /* read arg6 from the user stack; a fault here is redirected to ia32_badarg */
  139. ASM_STAC
  140. 1: movl (%rbp),%ebp
  141. _ASM_EXTABLE(1b,ia32_badarg)
  142. ASM_CLAC
  /* flag the thread as being inside a compat syscall */
  143. orl $TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  /* any syscall-entry work flag set? then take the slow path */
  144. testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  145. CFI_REMEMBER_STATE
  146. jnz sysenter_tracesys
  /* unsigned range check of the syscall number */
  147. cmpq $(IA32_NR_syscalls-1),%rax
  148. ja ia32_badsys
  149. sysenter_do_call:
  150. IA32_ARG_FIXUP
  151. sysenter_dispatch:
  /* the table holds 8-byte handler pointers indexed by syscall number */
  152. call *ia32_sys_call_table(,%rax,8)
  153. movq %rax,RAX-ARGOFFSET(%rsp) /* store the return value in the frame */
  154. DISABLE_INTERRUPTS(CLBR_NONE)
  155. TRACE_IRQS_OFF
  /* any exit work pending? then leave the fast path */
  156. testl $_TIF_ALLWORK_MASK,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  157. jnz sysexit_audit
  158. sysexit_from_sys_call:
  159. andl $~TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  160. /* clear IF (0x200) in the saved flags, so that popfq doesn't enable interrupts early */
  161. andl $~0x200,EFLAGS-R11(%rsp)
  162. movl RIP-R11(%rsp),%edx /* User %eip */
  163. CFI_REGISTER rip,rdx
  /* NOTE(review): RESTORE_ARGS is defined outside this file; its arguments
     select which saved registers are reloaded and how far %rsp is moved -
     confirm the exact meaning in <asm/calling.h>. */
  164. RESTORE_ARGS 0,24,0,0,0,0
  /* zero r8-r11 before returning to user mode */
  165. xorq %r8,%r8
  166. xorq %r9,%r9
  167. xorq %r10,%r10
  168. xorq %r11,%r11
  169. popfq_cfi
  170. /*CFI_RESTORE rflags*/
  171. popq_cfi %rcx /* User %esp */
  172. CFI_REGISTER rsp,rcx
  173. TRACE_IRQS_ON
  /* return to user mode: SYSEXIT takes %eip from %edx and %esp from %ecx */
  174. ENABLE_INTERRUPTS_SYSEXIT32
  175. #ifdef CONFIG_AUDITSYSCALL
  /*
   * auditsys_entry_common - report a syscall entry to the audit code and
   * then set up the handler arguments.
   *
   * Expects the syscall number in %eax and the first four syscall
   * arguments still in their entry registers (%ebx, %ecx, %edx, %esi).
   * After __audit_syscall_entry returns, the syscall number is reloaded and
   * range-checked, and arg1..arg5 are placed in %edi, %esi, %edx, %ecx,
   * %r8d (the layout IA32_ARG_FIXUP produces). %r9d (arg6) is left for the
   * user of the macro to reload.
   */
  176. .macro auditsys_entry_common
  177. movl %esi,%r9d /* 6th arg: 4th syscall arg */
  178. movl %edx,%r8d /* 5th arg: 3rd syscall arg */
  179. /* (already in %ecx) 4th arg: 2nd syscall arg */
  180. movl %ebx,%edx /* 3rd arg: 1st syscall arg */
  181. movl %eax,%esi /* 2nd arg: syscall number */
  182. movl $AUDIT_ARCH_I386,%edi /* 1st arg: audit arch */
  183. call __audit_syscall_entry
  184. movl RAX-ARGOFFSET(%rsp),%eax /* reload syscall number */
  185. cmpq $(IA32_NR_syscalls-1),%rax
  186. ja ia32_badsys
  /* %ebx is callee-saved, so it still holds arg1 after the call */
  187. movl %ebx,%edi /* reload 1st syscall arg */
  188. movl RCX-ARGOFFSET(%rsp),%esi /* reload 2nd syscall arg */
  189. movl RDX-ARGOFFSET(%rsp),%edx /* reload 3rd syscall arg */
  190. movl RSI-ARGOFFSET(%rsp),%ecx /* reload 4th syscall arg */
  191. movl RDI-ARGOFFSET(%rsp),%r8d /* reload 5th syscall arg */
  192. .endm
  /*
   * auditsys_exit - report a syscall exit to the audit code.
   *
   * exit: label to jump to afterwards when no other exit work is pending
   *       (the fast return path of the invoking entry point).
   *
   * Expects the syscall return value in %eax. If any work flag other than
   * the audit flag is set, the generic ia32_ret_from_sys_call path is taken
   * instead. After the audit call the flags are re-checked with interrupts
   * disabled; if work has appeared, control goes to int_with_check (defined
   * outside this file).
   */
  193. .macro auditsys_exit exit
  194. testl $(_TIF_ALLWORK_MASK & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  195. jnz ia32_ret_from_sys_call
  196. TRACE_IRQS_ON
  197. ENABLE_INTERRUPTS(CLBR_NONE)
  198. movl %eax,%esi /* second arg, syscall return value */
  199. cmpl $-MAX_ERRNO,%eax /* is it an error ? */
  200. jbe 1f
  201. movslq %eax, %rsi /* if error sign extend to 64 bits */
  /*
   * The flags from the cmpl above are still intact here (neither jbe nor
   * movslq changes them), so setbe yields 1 exactly when the jbe branch
   * was taken, i.e. when the value is NOT in the error range.
   * NOTE(review): a return value exactly equal to -MAX_ERRNO takes the
   * non-error branch; confirm that this boundary is intended.
   */
  202. 1: setbe %al /* 1 if not an error, 0 if error */
  203. movzbl %al,%edi /* zero-extend that into %edi */
  204. call __audit_syscall_exit
  205. movq RAX-ARGOFFSET(%rsp),%rax /* reload syscall return value */
  206. movl $(_TIF_ALLWORK_MASK & ~_TIF_SYSCALL_AUDIT),%edi
  207. DISABLE_INTERRUPTS(CLBR_NONE)
  208. TRACE_IRQS_OFF
  /* re-check for non-audit work now that interrupts are off again */
  209. testl %edi,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  210. jz \exit
  211. CLEAR_RREGS -ARGOFFSET
  212. jmp int_with_check
  213. .endm
  /* SYSENTER entry with only the audit flag set: audit, then dispatch */
  214. sysenter_auditsys:
  215. CFI_RESTORE_STATE
  216. auditsys_entry_common
  217. movl %ebp,%r9d /* reload 6th syscall arg */
  218. jmp sysenter_dispatch
  /* SYSENTER exit with work flags set: audit, then SYSEXIT if nothing else */
  219. sysexit_audit:
  220. auditsys_exit sysexit_from_sys_call
  221. #endif
  /*
   * Slow entry path for SYSENTER, reached when a syscall-entry work flag is
   * set. If auditing is the only reason (and audit support is built in),
   * the lighter sysenter_auditsys path is used. Otherwise the remaining
   * registers are saved and syscall_trace_enter() is called with a pointer
   * to the full register frame.
   */
  222. sysenter_tracesys:
  223. #ifdef CONFIG_AUDITSYSCALL
  224. testl $(_TIF_WORK_SYSCALL_ENTRY & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  225. jz sysenter_auditsys
  226. #endif
  227. SAVE_REST
  228. CLEAR_RREGS
  229. movq $-ENOSYS,RAX(%rsp)/* ptrace can change this for a bad syscall */
  230. movq %rsp,%rdi /* &pt_regs -> arg1 */
  231. call syscall_trace_enter
  232. LOAD_ARGS32 ARGOFFSET /* reload args from stack in case ptrace changed it */
  233. RESTORE_REST
  /* %rax is the (possibly changed) syscall number returned by the tracer hook */
  234. cmpq $(IA32_NR_syscalls-1),%rax
  235. ja int_ret_from_sys_call /* sysenter_tracesys has set RAX(%rsp) */
  236. jmp sysenter_do_call
  237. CFI_ENDPROC
  238. ENDPROC(ia32_sysenter_target)
  239. /*
  240. * 32bit SYSCALL instruction entry.
  241. *
  242. * Arguments:
  243. * %eax System call number.
  244. * %ebx Arg1
  245. * %ecx return EIP
  246. * %edx Arg3
  247. * %esi Arg4
  248. * %edi Arg5
  249. * %ebp Arg2 [note: not saved in the stack frame, should not be touched]
  250. * %esp user stack
  251. * 0(%esp) Arg6
  252. *
  253. * Interrupts off.
  254. *
  255. * This is purely a fast path. For anything complicated we use the int 0x80
  256. * path below. Set up a complete hardware stack frame to share code
  257. * with the int 0x80 path.
  258. */
  /*
   * Differences from the SYSENTER entry visible below: the return address
   * arrives in %rcx and the user flags in %r11, the user stack pointer is
   * still in %esp on entry, arg2 arrives in %ebp, and arg6 is read into
   * %r9d. The frame slots are filled with explicit stores instead of pushes,
   * and the fast return uses SYSRET.
   */
  259. ENTRY(ia32_cstar_target)
  260. CFI_STARTPROC32 simple
  261. CFI_SIGNAL_FRAME
  262. CFI_DEF_CFA rsp,KERNEL_STACK_OFFSET
  263. CFI_REGISTER rip,rcx
  264. /*CFI_REGISTER rflags,r11*/
  265. SWAPGS_UNSAFE_STACK
  266. movl %esp,%r8d /* keep the user stack pointer, zero-extended */
  267. CFI_REGISTER rsp,r8
  268. movq PER_CPU_VAR(kernel_stack),%rsp
  269. /*
  270. * No need to follow this irqs on/off section: the syscall
  271. * disabled irqs and here we enable it straight after entry:
  272. */
  273. ENABLE_INTERRUPTS(CLBR_NONE)
  /* NOTE(review): SAVE_ARGS is defined outside this file; confirm the
     meaning of its arguments in <asm/calling.h>. */
  274. SAVE_ARGS 8,0,0
  275. movl %eax,%eax /* zero extension */
  /* fill in the remaining frame slots by hand */
  276. movq %rax,ORIG_RAX-ARGOFFSET(%rsp)
  277. movq %rcx,RIP-ARGOFFSET(%rsp)
  278. CFI_REL_OFFSET rip,RIP-ARGOFFSET
  279. movq %rbp,RCX-ARGOFFSET(%rsp) /* this lies slightly to ptrace */
  280. movl %ebp,%ecx /* arg2 into %ecx, where the other entry paths have it */
  281. movq $__USER32_CS,CS-ARGOFFSET(%rsp)
  282. movq $__USER32_DS,SS-ARGOFFSET(%rsp)
  283. movq %r11,EFLAGS-ARGOFFSET(%rsp)
  284. /*CFI_REL_OFFSET rflags,EFLAGS-ARGOFFSET*/
  285. movq %r8,RSP-ARGOFFSET(%rsp)
  286. CFI_REL_OFFSET rsp,RSP-ARGOFFSET
  287. /* no need to do an access_ok check here because r8 has been
  288. 32bit zero extended */
  289. /* hardware stack frame is complete now */
  /* read arg6 from the user stack; a fault here is redirected to ia32_badarg */
  290. ASM_STAC
  291. 1: movl (%r8),%r9d
  292. _ASM_EXTABLE(1b,ia32_badarg)
  293. ASM_CLAC
  /* flag the thread as being inside a compat syscall */
  294. orl $TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  /* any syscall-entry work flag set? then take the slow path */
  295. testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  296. CFI_REMEMBER_STATE
  297. jnz cstar_tracesys
  /* unsigned range check of the syscall number */
  298. cmpq $IA32_NR_syscalls-1,%rax
  299. ja ia32_badsys
  300. cstar_do_call:
  /* noebp=1: arg6 is already in %r9d, and %ebp holds arg2 rather than arg6 */
  301. IA32_ARG_FIXUP 1
  302. cstar_dispatch:
  303. call *ia32_sys_call_table(,%rax,8)
  304. movq %rax,RAX-ARGOFFSET(%rsp) /* store the return value in the frame */
  305. DISABLE_INTERRUPTS(CLBR_NONE)
  306. TRACE_IRQS_OFF
  /* any exit work pending? then leave the fast path */
  307. testl $_TIF_ALLWORK_MASK,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  308. jnz sysretl_audit
  309. sysretl_from_sys_call:
  310. andl $~TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  /* NOTE(review): RESTORE_ARGS is defined outside this file; confirm which
     registers this invocation reloads in <asm/calling.h>. */
  311. RESTORE_ARGS 0,-ARG_SKIP,0,0,0
  /* SYSRET takes the return address from %rcx and the flags from %r11 */
  312. movl RIP-ARGOFFSET(%rsp),%ecx
  313. CFI_REGISTER rip,rcx
  314. movl EFLAGS-ARGOFFSET(%rsp),%r11d
  315. /*CFI_REGISTER rflags,r11*/
  /* zero r8-r10 before returning to user mode */
  316. xorq %r10,%r10
  317. xorq %r9,%r9
  318. xorq %r8,%r8
  319. TRACE_IRQS_ON
  320. movl RSP-ARGOFFSET(%rsp),%esp /* back onto the user stack */
  321. CFI_RESTORE rsp
  322. USERGS_SYSRET32
  323. #ifdef CONFIG_AUDITSYSCALL
  /*
   * SYSCALL entry with only the audit flag set. arg6 lives in %r9d, which
   * auditsys_entry_common overwrites, so it is parked in the R9 frame slot
   * around the macro and then dispatch continues as on the fast path.
   */
  324. cstar_auditsys:
  325. CFI_RESTORE_STATE
  326. movl %r9d,R9-ARGOFFSET(%rsp) /* register to be clobbered by call */
  327. auditsys_entry_common
  328. movl R9-ARGOFFSET(%rsp),%r9d /* reload 6th syscall arg */
  329. jmp cstar_dispatch
  /* SYSCALL exit with work flags set: audit, then SYSRET if nothing else */
  330. sysretl_audit:
  331. auditsys_exit sysretl_from_sys_call
  332. #endif
  /*
   * Slow entry path for SYSCALL, reached when a syscall-entry work flag is
   * set. Same shape as the SYSENTER slow path, with extra shuffling because
   * on this entry %r9d holds arg6 and %ebp holds arg2.
   */
  333. cstar_tracesys:
  334. #ifdef CONFIG_AUDITSYSCALL
  335. testl $(_TIF_WORK_SYSCALL_ENTRY & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  336. jz cstar_auditsys
  337. #endif
  /* now %ebp = arg6 and %r9d = arg2 (the value that arrived in %ebp) */
  338. xchgl %r9d,%ebp
  /* NOTE(review): SAVE_REST is defined outside this file; presumably it
     stores %rbp (now arg6) into the frame, matching the other entry paths -
     confirm. */
  339. SAVE_REST
  /* R9 slot keeps the value in %r9; the R8/R10/R11 slots are zeroed */
  340. CLEAR_RREGS 0, r9
  341. movq $-ENOSYS,RAX(%rsp) /* ptrace can change this for a bad syscall */
  342. movq %rsp,%rdi /* &pt_regs -> arg1 */
  343. call syscall_trace_enter
  /* the second argument makes LOAD_ARGS32 reload %r9d from the frame too */
  344. LOAD_ARGS32 ARGOFFSET, 1 /* reload args from stack in case ptrace changed it */
  345. RESTORE_REST
  /* undo the swap: %r9d = arg6 and %ebp = arg2 again */
  346. xchgl %ebp,%r9d
  347. cmpq $(IA32_NR_syscalls-1),%rax
  348. ja int_ret_from_sys_call /* cstar_tracesys has set RAX(%rsp) */
  349. jmp cstar_do_call
  350. END(ia32_cstar_target)
  /*
   * Exception-table fixup target for the arg6 loads from the user stack in
   * the SYSENTER and SYSCALL entries. The faulting load sits between
   * ASM_STAC and ASM_CLAC, so the ASM_CLAC after it was skipped and is
   * repeated here. The syscall then returns -EFAULT through ia32_sysret.
   */
  351. ia32_badarg:
  352. ASM_CLAC
  353. movq $-EFAULT,%rax
  354. jmp ia32_sysret
  355. CFI_ENDPROC
  356. /*
  357. * Emulated IA32 system calls via int 0x80.
  358. *
  359. * Arguments:
  360. * %eax System call number.
  361. * %ebx Arg1
  362. * %ecx Arg2
  363. * %edx Arg3
  364. * %esi Arg4
  365. * %edi Arg5
  366. * %ebp Arg6 [note: not saved in the stack frame, should not be touched]
  367. *
  368. * Notes:
  369. * Uses the same stack frame as the x86-64 version.
  370. * All registers except %eax must be saved (but ptrace may violate that)
  371. * Arguments are zero extended. For system calls that want sign extension and
  372. * take long arguments a wrapper is needed. Most calls can just be called
  373. * directly.
  374. * Assumes it is only called from user space and entered with interrupts off.
  375. */
  /*
   * Unlike the two fast paths above, nothing is pushed here for SS, RSP,
   * flags, CS or RIP: the CFI annotations below describe those slots as
   * already being on the stack at entry. Only the syscall number and the
   * argument registers are saved. The return always goes through
   * int_ret_from_sys_call (defined outside this file).
   */
  376. ENTRY(ia32_syscall)
  377. CFI_STARTPROC32 simple
  378. CFI_SIGNAL_FRAME
  379. CFI_DEF_CFA rsp,SS+8-RIP
  380. /*CFI_REL_OFFSET ss,SS-RIP*/
  381. CFI_REL_OFFSET rsp,RSP-RIP
  382. /*CFI_REL_OFFSET rflags,EFLAGS-RIP*/
  383. /*CFI_REL_OFFSET cs,CS-RIP*/
  384. CFI_REL_OFFSET rip,RIP-RIP
  385. PARAVIRT_ADJUST_EXCEPTION_FRAME
  386. SWAPGS
  387. /*
  388. * No need to follow this irqs on/off section: the syscall
  389. * disabled irqs and here we enable it straight after entry:
  390. */
  391. ENABLE_INTERRUPTS(CLBR_NONE)
  /* zero-extend the syscall number; the range check and table index use %rax */
  392. movl %eax,%eax
  393. pushq_cfi %rax /* syscall number */
  394. cld
  395. /* note the registers are not zero extended to the sf.
  396. this could be a problem. */
  397. SAVE_ARGS 0,1,0
  /* flag the thread as being inside a compat syscall */
  398. orl $TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  /* any syscall-entry work flag set? then take the slow path */
  399. testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  400. jnz ia32_tracesys
  /* unsigned range check of the syscall number */
  401. cmpq $(IA32_NR_syscalls-1),%rax
  402. ja ia32_badsys
  403. ia32_do_call:
  404. IA32_ARG_FIXUP
  405. call *ia32_sys_call_table(,%rax,8) # xxx: rip relative
  /* common tail: %rax holds the value to return to user space */
  406. ia32_sysret:
  407. movq %rax,RAX-ARGOFFSET(%rsp)
  /* zero the saved R8-R11 slots, then take the generic return path */
  408. ia32_ret_from_sys_call:
  409. CLEAR_RREGS -ARGOFFSET
  410. jmp int_ret_from_sys_call
  /*
   * Slow entry path for int 0x80, reached when a syscall-entry work flag is
   * set: save the remaining registers, call syscall_trace_enter() with a
   * pointer to the full register frame, reload the (possibly modified)
   * arguments and re-check the syscall number it returned in %rax.
   */
  411. ia32_tracesys:
  412. SAVE_REST
  413. CLEAR_RREGS
  414. movq $-ENOSYS,RAX(%rsp) /* ptrace can change this for a bad syscall */
  415. movq %rsp,%rdi /* &pt_regs -> arg1 */
  416. call syscall_trace_enter
  417. LOAD_ARGS32 ARGOFFSET /* reload args from stack in case ptrace changed it */
  418. RESTORE_REST
  419. cmpq $(IA32_NR_syscalls-1),%rax
  420. ja int_ret_from_sys_call /* ia32_tracesys has set RAX(%rsp) */
  421. jmp ia32_do_call
  422. END(ia32_syscall)
  /*
   * Target for out-of-range syscall numbers on all three entry paths:
   * zero the ORIG_RAX slot and return -ENOSYS through ia32_sysret.
   */
  423. ia32_badsys:
  424. movq $0,ORIG_RAX-ARGOFFSET(%rsp)
  425. movq $-ENOSYS,%rax
  426. jmp ia32_sysret
  427. CFI_ENDPROC
  /*
   * PTREGSCALL - emit a global, aligned stub named label that loads the
   * address of func into %rax (RIP-relative) and jumps to
   * ia32_ptregs_common, which performs the actual call.
   *
   * label: name of the stub to define.
   * func:  function that ia32_ptregs_common will call.
   * arg:   not referenced in the macro body.
   */
  428. .macro PTREGSCALL label, func, arg
  429. ALIGN
  430. GLOBAL(\label)
  431. leaq \func(%rip),%rax
  432. jmp ia32_ptregs_common
  433. .endm
  /*
   * Stubs for the syscalls that are routed through ia32_ptregs_common.
   * Each one only selects the target function in %rax. The CFI procedure
   * opened here is closed inside ia32_ptregs_common.
   */
  434. CFI_STARTPROC32
  435. PTREGSCALL stub32_rt_sigreturn, sys32_rt_sigreturn
  436. PTREGSCALL stub32_sigreturn, sys32_sigreturn
  437. PTREGSCALL stub32_execve, compat_sys_execve
  438. PTREGSCALL stub32_fork, sys_fork
  439. PTREGSCALL stub32_vfork, sys_vfork
  /*
   * Hand-written variant of the stubs above: besides selecting sys_clone it
   * copies %r8 into %rcx. NOTE(review): presumably this reorders the
   * arguments to match the parameter order sys_clone expects - confirm
   * against its prototype.
   */
  440. ALIGN
  441. GLOBAL(stub32_clone)
  442. leaq sys_clone(%rip),%rax
  443. mov %r8, %rcx
  444. jmp ia32_ptregs_common
  /*
   * Common tail of the PTREGSCALL stubs. Expects the address of the target
   * function in %rax. It removes the top stack word, saves the remaining
   * registers with SAVE_REST, calls the target, restores them, and leaves
   * through ia32_sysret with the target's return value in %rax.
   */
  445. ALIGN
  446. ia32_ptregs_common:
  /* NOTE(review): presumably the popped word is the return address pushed by
     the indirect call through ia32_sys_call_table that reached the stub, so
     that %rsp points at the saved-argument area again - confirm. */
  447. popq %r11
  448. CFI_ENDPROC
  449. CFI_STARTPROC32 simple
  450. CFI_SIGNAL_FRAME
  451. CFI_DEF_CFA rsp,SS+8-ARGOFFSET
  452. CFI_REL_OFFSET rax,RAX-ARGOFFSET
  453. CFI_REL_OFFSET rcx,RCX-ARGOFFSET
  454. CFI_REL_OFFSET rdx,RDX-ARGOFFSET
  455. CFI_REL_OFFSET rsi,RSI-ARGOFFSET
  456. CFI_REL_OFFSET rdi,RDI-ARGOFFSET
  457. CFI_REL_OFFSET rip,RIP-ARGOFFSET
  458. /* CFI_REL_OFFSET cs,CS-ARGOFFSET*/
  459. /* CFI_REL_OFFSET rflags,EFLAGS-ARGOFFSET*/
  460. CFI_REL_OFFSET rsp,RSP-ARGOFFSET
  461. /* CFI_REL_OFFSET ss,SS-ARGOFFSET*/
  462. SAVE_REST
  463. call *%rax /* target selected by the stub */
  464. RESTORE_REST
  /* leaves with a jmp rather than a ret, since the word on top of the stack
     was popped above */
  465. jmp ia32_sysret /* misbalances the return cache */
  466. CFI_ENDPROC
  467. END(ia32_ptregs_common)