ia32entry.S 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490
  1. /*
  2. * Compatibility mode system call entry point for x86-64.
  3. *
  4. * Copyright 2000-2002 Andi Kleen, SuSE Labs.
  5. */
  6. #include <asm/dwarf2.h>
  7. #include <asm/calling.h>
  8. #include <asm/asm-offsets.h>
  9. #include <asm/current.h>
  10. #include <asm/errno.h>
  11. #include <asm/ia32_unistd.h>
  12. #include <asm/thread_info.h>
  13. #include <asm/segment.h>
  14. #include <asm/irqflags.h>
  15. #include <asm/asm.h>
  16. #include <linux/linkage.h>
  17. #include <linux/err.h>
  18. /* Avoid __ASSEMBLER__'ifying <linux/audit.h> just for this. */
  19. #include <linux/elf-em.h>
  20. #define AUDIT_ARCH_I386 (EM_386|__AUDIT_ARCH_LE)
  21. #define __AUDIT_ARCH_LE 0x40000000
  22. #ifndef CONFIG_AUDITSYSCALL
  23. #define sysexit_audit ia32_ret_from_sys_call
  24. #define sysretl_audit ia32_ret_from_sys_call
  25. #endif
  26. .section .entry.text, "ax"
  27. .macro IA32_ARG_FIXUP noebp=0
  28. movl %edi,%r8d
  29. .if \noebp
  30. .else
  31. movl %ebp,%r9d
  32. .endif
  33. xchg %ecx,%esi
  34. movl %ebx,%edi
  35. movl %edx,%edx /* zero extension */
  36. .endm
  37. /* clobbers %eax */
  38. .macro CLEAR_RREGS offset=0, _r9=rax
  39. xorl %eax,%eax
  40. movq %rax,\offset+R11(%rsp)
  41. movq %rax,\offset+R10(%rsp)
  42. movq %\_r9,\offset+R9(%rsp)
  43. movq %rax,\offset+R8(%rsp)
  44. .endm
  45. /*
  46. * Reload arg registers from stack in case ptrace changed them.
  47. * We don't reload %eax because syscall_trace_enter() returned
  48. * the %rax value we should see. Instead, we just truncate that
  49. * value to 32 bits again as we did on entry from user mode.
  50. * If it's a new value set by user_regset during entry tracing,
  51. * this matches the normal truncation of the user-mode value.
  52. * If it's -1 to make us punt the syscall, then (u32)-1 is still
  53. * an appropriately invalid value.
  54. */
  55. .macro LOAD_ARGS32 offset, _r9=0
  56. .if \_r9
  57. movl \offset+16(%rsp),%r9d
  58. .endif
  59. movl \offset+40(%rsp),%ecx
  60. movl \offset+48(%rsp),%edx
  61. movl \offset+56(%rsp),%esi
  62. movl \offset+64(%rsp),%edi
  63. movl %eax,%eax /* zero extension */
  64. .endm
  65. .macro CFI_STARTPROC32 simple
  66. CFI_STARTPROC \simple
  67. CFI_UNDEFINED r8
  68. CFI_UNDEFINED r9
  69. CFI_UNDEFINED r10
  70. CFI_UNDEFINED r11
  71. CFI_UNDEFINED r12
  72. CFI_UNDEFINED r13
  73. CFI_UNDEFINED r14
  74. CFI_UNDEFINED r15
  75. .endm
  76. #ifdef CONFIG_PARAVIRT
  77. ENTRY(native_usergs_sysret32)
  78. swapgs
  79. sysretl
  80. ENDPROC(native_usergs_sysret32)
  81. ENTRY(native_irq_enable_sysexit)
  82. swapgs
  83. sti
  84. sysexit
  85. ENDPROC(native_irq_enable_sysexit)
  86. #endif
  87. /*
  88. * 32bit SYSENTER instruction entry.
  89. *
  90. * Arguments:
  91. * %eax System call number.
  92. * %ebx Arg1
  93. * %ecx Arg2
  94. * %edx Arg3
  95. * %esi Arg4
  96. * %edi Arg5
  97. * %ebp user stack
  98. * 0(%ebp) Arg6
  99. *
  100. * Interrupts off.
  101. *
  102. * This is purely a fast path. For anything complicated we use the int 0x80
  103. * path below. Set up a complete hardware stack frame to share code
  104. * with the int 0x80 path.
  105. */
  106. ENTRY(ia32_sysenter_target)
  107. CFI_STARTPROC32 simple
  108. CFI_SIGNAL_FRAME
  109. CFI_DEF_CFA rsp,0
  110. CFI_REGISTER rsp,rbp
  111. SWAPGS_UNSAFE_STACK
  112. movq PER_CPU_VAR(kernel_stack), %rsp
  113. addq $(KERNEL_STACK_OFFSET),%rsp
  114. /*
  115. * No need to follow this irqs on/off section: the syscall
  116. * disabled irqs, here we enable it straight after entry:
  117. */
  118. ENABLE_INTERRUPTS(CLBR_NONE)
  119. movl %ebp,%ebp /* zero extension */
  120. pushq_cfi $__USER32_DS
  121. /*CFI_REL_OFFSET ss,0*/
  122. pushq_cfi %rbp
  123. CFI_REL_OFFSET rsp,0
  124. pushfq_cfi
  125. /*CFI_REL_OFFSET rflags,0*/
  126. movl TI_sysenter_return+THREAD_INFO(%rsp,3*8-KERNEL_STACK_OFFSET),%r10d
  127. CFI_REGISTER rip,r10
  128. pushq_cfi $__USER32_CS
  129. /*CFI_REL_OFFSET cs,0*/
  130. movl %eax, %eax
  131. pushq_cfi %r10
  132. CFI_REL_OFFSET rip,0
  133. pushq_cfi %rax
  134. cld
  135. SAVE_ARGS 0,1,0
  136. /* no need to do an access_ok check here because rbp has been
  137. 32bit zero extended */
  138. 1: movl (%rbp),%ebp
  139. _ASM_EXTABLE(1b,ia32_badarg)
  140. orl $TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  141. testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  142. CFI_REMEMBER_STATE
  143. jnz sysenter_tracesys
  144. cmpq $(IA32_NR_syscalls-1),%rax
  145. ja ia32_badsys
  146. sysenter_do_call:
  147. IA32_ARG_FIXUP
  148. sysenter_dispatch:
  149. call *ia32_sys_call_table(,%rax,8)
  150. movq %rax,RAX-ARGOFFSET(%rsp)
  151. DISABLE_INTERRUPTS(CLBR_NONE)
  152. TRACE_IRQS_OFF
  153. testl $_TIF_ALLWORK_MASK,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  154. jnz sysexit_audit
  155. sysexit_from_sys_call:
  156. andl $~TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  157. /* clear IF, that popfq doesn't enable interrupts early */
  158. andl $~0x200,EFLAGS-R11(%rsp)
  159. movl RIP-R11(%rsp),%edx /* User %eip */
  160. CFI_REGISTER rip,rdx
  161. RESTORE_ARGS 0,24,0,0,0,0
  162. xorq %r8,%r8
  163. xorq %r9,%r9
  164. xorq %r10,%r10
  165. xorq %r11,%r11
  166. popfq_cfi
  167. /*CFI_RESTORE rflags*/
  168. popq_cfi %rcx /* User %esp */
  169. CFI_REGISTER rsp,rcx
  170. TRACE_IRQS_ON
  171. ENABLE_INTERRUPTS_SYSEXIT32
  172. #ifdef CONFIG_AUDITSYSCALL
  173. .macro auditsys_entry_common
  174. movl %esi,%r9d /* 6th arg: 4th syscall arg */
  175. movl %edx,%r8d /* 5th arg: 3rd syscall arg */
  176. /* (already in %ecx) 4th arg: 2nd syscall arg */
  177. movl %ebx,%edx /* 3rd arg: 1st syscall arg */
  178. movl %eax,%esi /* 2nd arg: syscall number */
  179. movl $AUDIT_ARCH_I386,%edi /* 1st arg: audit arch */
  180. call __audit_syscall_entry
  181. movl RAX-ARGOFFSET(%rsp),%eax /* reload syscall number */
  182. cmpq $(IA32_NR_syscalls-1),%rax
  183. ja ia32_badsys
  184. movl %ebx,%edi /* reload 1st syscall arg */
  185. movl RCX-ARGOFFSET(%rsp),%esi /* reload 2nd syscall arg */
  186. movl RDX-ARGOFFSET(%rsp),%edx /* reload 3rd syscall arg */
  187. movl RSI-ARGOFFSET(%rsp),%ecx /* reload 4th syscall arg */
  188. movl RDI-ARGOFFSET(%rsp),%r8d /* reload 5th syscall arg */
  189. .endm
  190. .macro auditsys_exit exit
  191. testl $(_TIF_ALLWORK_MASK & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  192. jnz ia32_ret_from_sys_call
  193. TRACE_IRQS_ON
  194. sti
  195. movl %eax,%esi /* second arg, syscall return value */
  196. cmpl $-MAX_ERRNO,%eax /* is it an error ? */
  197. jbe 1f
  198. movslq %eax, %rsi /* if error sign extend to 64 bits */
  199. 1: setbe %al /* 1 if error, 0 if not */
  200. movzbl %al,%edi /* zero-extend that into %edi */
  201. call __audit_syscall_exit
  202. movq RAX-ARGOFFSET(%rsp),%rax /* reload syscall return value */
  203. movl $(_TIF_ALLWORK_MASK & ~_TIF_SYSCALL_AUDIT),%edi
  204. cli
  205. TRACE_IRQS_OFF
  206. testl %edi,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  207. jz \exit
  208. CLEAR_RREGS -ARGOFFSET
  209. jmp int_with_check
  210. .endm
  211. sysenter_auditsys:
  212. CFI_RESTORE_STATE
  213. auditsys_entry_common
  214. movl %ebp,%r9d /* reload 6th syscall arg */
  215. jmp sysenter_dispatch
  216. sysexit_audit:
  217. auditsys_exit sysexit_from_sys_call
  218. #endif
  219. sysenter_tracesys:
  220. #ifdef CONFIG_AUDITSYSCALL
  221. testl $(_TIF_WORK_SYSCALL_ENTRY & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  222. jz sysenter_auditsys
  223. #endif
  224. SAVE_REST
  225. CLEAR_RREGS
  226. movq $-ENOSYS,RAX(%rsp)/* ptrace can change this for a bad syscall */
  227. movq %rsp,%rdi /* &pt_regs -> arg1 */
  228. call syscall_trace_enter
  229. LOAD_ARGS32 ARGOFFSET /* reload args from stack in case ptrace changed it */
  230. RESTORE_REST
  231. cmpq $(IA32_NR_syscalls-1),%rax
  232. ja int_ret_from_sys_call /* sysenter_tracesys has set RAX(%rsp) */
  233. jmp sysenter_do_call
  234. CFI_ENDPROC
  235. ENDPROC(ia32_sysenter_target)
  236. /*
  237. * 32bit SYSCALL instruction entry.
  238. *
  239. * Arguments:
  240. * %eax System call number.
  241. * %ebx Arg1
  242. * %ecx return EIP
  243. * %edx Arg3
  244. * %esi Arg4
  245. * %edi Arg5
  246. * %ebp Arg2 [note: not saved in the stack frame, should not be touched]
  247. * %esp user stack
  248. * 0(%esp) Arg6
  249. *
  250. * Interrupts off.
  251. *
  252. * This is purely a fast path. For anything complicated we use the int 0x80
  253. * path below. Set up a complete hardware stack frame to share code
  254. * with the int 0x80 path.
  255. */
  256. ENTRY(ia32_cstar_target)
  257. CFI_STARTPROC32 simple
  258. CFI_SIGNAL_FRAME
  259. CFI_DEF_CFA rsp,KERNEL_STACK_OFFSET
  260. CFI_REGISTER rip,rcx
  261. /*CFI_REGISTER rflags,r11*/
  262. SWAPGS_UNSAFE_STACK
  263. movl %esp,%r8d
  264. CFI_REGISTER rsp,r8
  265. movq PER_CPU_VAR(kernel_stack),%rsp
  266. /*
  267. * No need to follow this irqs on/off section: the syscall
  268. * disabled irqs and here we enable it straight after entry:
  269. */
  270. ENABLE_INTERRUPTS(CLBR_NONE)
  271. SAVE_ARGS 8,0,0
  272. movl %eax,%eax /* zero extension */
  273. movq %rax,ORIG_RAX-ARGOFFSET(%rsp)
  274. movq %rcx,RIP-ARGOFFSET(%rsp)
  275. CFI_REL_OFFSET rip,RIP-ARGOFFSET
  276. movq %rbp,RCX-ARGOFFSET(%rsp) /* this lies slightly to ptrace */
  277. movl %ebp,%ecx
  278. movq $__USER32_CS,CS-ARGOFFSET(%rsp)
  279. movq $__USER32_DS,SS-ARGOFFSET(%rsp)
  280. movq %r11,EFLAGS-ARGOFFSET(%rsp)
  281. /*CFI_REL_OFFSET rflags,EFLAGS-ARGOFFSET*/
  282. movq %r8,RSP-ARGOFFSET(%rsp)
  283. CFI_REL_OFFSET rsp,RSP-ARGOFFSET
  284. /* no need to do an access_ok check here because r8 has been
  285. 32bit zero extended */
  286. /* hardware stack frame is complete now */
  287. 1: movl (%r8),%r9d
  288. _ASM_EXTABLE(1b,ia32_badarg)
  289. orl $TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  290. testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  291. CFI_REMEMBER_STATE
  292. jnz cstar_tracesys
  293. cmpq $IA32_NR_syscalls-1,%rax
  294. ja ia32_badsys
  295. cstar_do_call:
  296. IA32_ARG_FIXUP 1
  297. cstar_dispatch:
  298. call *ia32_sys_call_table(,%rax,8)
  299. movq %rax,RAX-ARGOFFSET(%rsp)
  300. DISABLE_INTERRUPTS(CLBR_NONE)
  301. TRACE_IRQS_OFF
  302. testl $_TIF_ALLWORK_MASK,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  303. jnz sysretl_audit
  304. sysretl_from_sys_call:
  305. andl $~TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  306. RESTORE_ARGS 0,-ARG_SKIP,0,0,0
  307. movl RIP-ARGOFFSET(%rsp),%ecx
  308. CFI_REGISTER rip,rcx
  309. movl EFLAGS-ARGOFFSET(%rsp),%r11d
  310. /*CFI_REGISTER rflags,r11*/
  311. xorq %r10,%r10
  312. xorq %r9,%r9
  313. xorq %r8,%r8
  314. TRACE_IRQS_ON
  315. movl RSP-ARGOFFSET(%rsp),%esp
  316. CFI_RESTORE rsp
  317. USERGS_SYSRET32
  318. #ifdef CONFIG_AUDITSYSCALL
  319. cstar_auditsys:
  320. CFI_RESTORE_STATE
  321. movl %r9d,R9-ARGOFFSET(%rsp) /* register to be clobbered by call */
  322. auditsys_entry_common
  323. movl R9-ARGOFFSET(%rsp),%r9d /* reload 6th syscall arg */
  324. jmp cstar_dispatch
  325. sysretl_audit:
  326. auditsys_exit sysretl_from_sys_call
  327. #endif
  328. cstar_tracesys:
  329. #ifdef CONFIG_AUDITSYSCALL
  330. testl $(_TIF_WORK_SYSCALL_ENTRY & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  331. jz cstar_auditsys
  332. #endif
  333. xchgl %r9d,%ebp
  334. SAVE_REST
  335. CLEAR_RREGS 0, r9
  336. movq $-ENOSYS,RAX(%rsp) /* ptrace can change this for a bad syscall */
  337. movq %rsp,%rdi /* &pt_regs -> arg1 */
  338. call syscall_trace_enter
  339. LOAD_ARGS32 ARGOFFSET, 1 /* reload args from stack in case ptrace changed it */
  340. RESTORE_REST
  341. xchgl %ebp,%r9d
  342. cmpq $(IA32_NR_syscalls-1),%rax
  343. ja int_ret_from_sys_call /* cstar_tracesys has set RAX(%rsp) */
  344. jmp cstar_do_call
  345. END(ia32_cstar_target)
  346. ia32_badarg:
  347. movq $-EFAULT,%rax
  348. jmp ia32_sysret
  349. CFI_ENDPROC
  350. /*
  351. * Emulated IA32 system calls via int 0x80.
  352. *
  353. * Arguments:
  354. * %eax System call number.
  355. * %ebx Arg1
  356. * %ecx Arg2
  357. * %edx Arg3
  358. * %esi Arg4
  359. * %edi Arg5
  360. * %ebp Arg6 [note: not saved in the stack frame, should not be touched]
  361. *
  362. * Notes:
  363. * Uses the same stack frame as the x86-64 version.
  364. * All registers except %eax must be saved (but ptrace may violate that)
  365. * Arguments are zero extended. For system calls that want sign extension and
  366. * take long arguments a wrapper is needed. Most calls can just be called
  367. * directly.
  368. * Assumes it is only called from user space and entered with interrupts off.
  369. */
  370. ENTRY(ia32_syscall)
  371. CFI_STARTPROC32 simple
  372. CFI_SIGNAL_FRAME
  373. CFI_DEF_CFA rsp,SS+8-RIP
  374. /*CFI_REL_OFFSET ss,SS-RIP*/
  375. CFI_REL_OFFSET rsp,RSP-RIP
  376. /*CFI_REL_OFFSET rflags,EFLAGS-RIP*/
  377. /*CFI_REL_OFFSET cs,CS-RIP*/
  378. CFI_REL_OFFSET rip,RIP-RIP
  379. PARAVIRT_ADJUST_EXCEPTION_FRAME
  380. SWAPGS
  381. /*
  382. * No need to follow this irqs on/off section: the syscall
  383. * disabled irqs and here we enable it straight after entry:
  384. */
  385. ENABLE_INTERRUPTS(CLBR_NONE)
  386. movl %eax,%eax
  387. pushq_cfi %rax
  388. cld
  389. /* note the registers are not zero extended to the sf.
  390. this could be a problem. */
  391. SAVE_ARGS 0,1,0
  392. orl $TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  393. testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
  394. jnz ia32_tracesys
  395. cmpq $(IA32_NR_syscalls-1),%rax
  396. ja ia32_badsys
  397. ia32_do_call:
  398. IA32_ARG_FIXUP
  399. call *ia32_sys_call_table(,%rax,8) # xxx: rip relative
  400. ia32_sysret:
  401. movq %rax,RAX-ARGOFFSET(%rsp)
  402. ia32_ret_from_sys_call:
  403. CLEAR_RREGS -ARGOFFSET
  404. jmp int_ret_from_sys_call
  405. ia32_tracesys:
  406. SAVE_REST
  407. CLEAR_RREGS
  408. movq $-ENOSYS,RAX(%rsp) /* ptrace can change this for a bad syscall */
  409. movq %rsp,%rdi /* &pt_regs -> arg1 */
  410. call syscall_trace_enter
  411. LOAD_ARGS32 ARGOFFSET /* reload args from stack in case ptrace changed it */
  412. RESTORE_REST
  413. cmpq $(IA32_NR_syscalls-1),%rax
  414. ja int_ret_from_sys_call /* ia32_tracesys has set RAX(%rsp) */
  415. jmp ia32_do_call
  416. END(ia32_syscall)
  417. ia32_badsys:
  418. movq $0,ORIG_RAX-ARGOFFSET(%rsp)
  419. movq $-ENOSYS,%rax
  420. jmp ia32_sysret
  421. CFI_ENDPROC
  422. .macro PTREGSCALL label, func, arg
  423. ALIGN
  424. GLOBAL(\label)
  425. leaq \func(%rip),%rax
  426. leaq -ARGOFFSET+8(%rsp),\arg /* 8 for return address */
  427. jmp ia32_ptregs_common
  428. .endm
  429. CFI_STARTPROC32
  430. PTREGSCALL stub32_rt_sigreturn, sys32_rt_sigreturn, %rdi
  431. PTREGSCALL stub32_sigreturn, sys32_sigreturn, %rdi
  432. PTREGSCALL stub32_sigaltstack, sys32_sigaltstack, %rdx
  433. PTREGSCALL stub32_execve, sys32_execve, %rcx
  434. PTREGSCALL stub32_fork, sys_fork, %rdi
  435. PTREGSCALL stub32_clone, sys32_clone, %rdx
  436. PTREGSCALL stub32_vfork, sys_vfork, %rdi
  437. PTREGSCALL stub32_iopl, sys_iopl, %rsi
  438. ALIGN
  439. ia32_ptregs_common:
  440. popq %r11
  441. CFI_ENDPROC
  442. CFI_STARTPROC32 simple
  443. CFI_SIGNAL_FRAME
  444. CFI_DEF_CFA rsp,SS+8-ARGOFFSET
  445. CFI_REL_OFFSET rax,RAX-ARGOFFSET
  446. CFI_REL_OFFSET rcx,RCX-ARGOFFSET
  447. CFI_REL_OFFSET rdx,RDX-ARGOFFSET
  448. CFI_REL_OFFSET rsi,RSI-ARGOFFSET
  449. CFI_REL_OFFSET rdi,RDI-ARGOFFSET
  450. CFI_REL_OFFSET rip,RIP-ARGOFFSET
  451. /* CFI_REL_OFFSET cs,CS-ARGOFFSET*/
  452. /* CFI_REL_OFFSET rflags,EFLAGS-ARGOFFSET*/
  453. CFI_REL_OFFSET rsp,RSP-ARGOFFSET
  454. /* CFI_REL_OFFSET ss,SS-ARGOFFSET*/
  455. SAVE_REST
  456. call *%rax
  457. RESTORE_REST
  458. jmp ia32_sysret /* misbalances the return cache */
  459. CFI_ENDPROC
  460. END(ia32_ptregs_common)