fsys.S 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884
  1. /*
  2. * This file contains the light-weight system call handlers (fsyscall-handlers).
  3. *
  4. * Copyright (C) 2003 Hewlett-Packard Co
  5. * David Mosberger-Tang <davidm@hpl.hp.com>
  6. *
  7. * 25-Sep-03 davidm Implement fsys_rt_sigprocmask().
  8. * 18-Feb-03 louisk Implement fsys_gettimeofday().
  9. * 28-Feb-03 davidm Fixed several bugs in fsys_gettimeofday(). Tuned it some more,
  10. * probably broke it along the way... ;-)
  11. * 13-Jul-04 clameter Implement fsys_clock_gettime and revise fsys_gettimeofday to make
  12. * it capable of using memory based clocks without falling back to C code.
  13. */
  14. #include <asm/asmmacro.h>
  15. #include <asm/errno.h>
  16. #include <asm/offsets.h>
  17. #include <asm/percpu.h>
  18. #include <asm/thread_info.h>
  19. #include <asm/sal.h>
  20. #include <asm/signal.h>
  21. #include <asm/system.h>
  22. #include <asm/unistd.h>
  23. #include "entry.h"
  24. /*
  25. * See Documentation/ia64/fsys.txt for details on fsyscalls.
  26. *
  27. * On entry to an fsyscall handler:
  28. * r10 = 0 (i.e., defaults to "successful syscall return")
  29. * r11 = saved ar.pfs (a user-level value)
  30. * r15 = system call number
  31. * r16 = "current" task pointer (in normal kernel-mode, this is in r13)
  32. * r32-r39 = system call arguments
  33. * b6 = return address (a user-level value)
  34. * ar.pfs = previous frame-state (a user-level value)
  35. * PSR.be = cleared to zero (i.e., little-endian byte order is in effect)
  36. * all other registers may contain values passed in from user-mode
  37. *
  38. * On return from an fsyscall handler:
  39. * r11 = saved ar.pfs (as passed into the fsyscall handler)
  40. * r15 = system call number (as passed into the fsyscall handler)
  41. * r32-r39 = system call arguments (as passed into the fsyscall handler)
  42. * b6 = return address (as passed into the fsyscall handler)
  43. * ar.pfs = previous frame-state (as passed into the fsyscall handler)
  44. */
  45. ENTRY(fsys_ni_syscall)
  46. .prologue
  47. .altrp b6
  48. .body
  49. mov r8=ENOSYS
  50. mov r10=-1
  51. FSYS_RETURN
  52. END(fsys_ni_syscall)
  53. ENTRY(fsys_getpid)
  54. .prologue
  55. .altrp b6
  56. .body
  57. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  58. ;;
  59. ld4 r9=[r9]
  60. add r8=IA64_TASK_TGID_OFFSET,r16
  61. ;;
  62. and r9=TIF_ALLWORK_MASK,r9
  63. ld4 r8=[r8] // r8 = current->tgid
  64. ;;
  65. cmp.ne p8,p0=0,r9
  66. (p8) br.spnt.many fsys_fallback_syscall
  67. FSYS_RETURN
  68. END(fsys_getpid)
  69. ENTRY(fsys_getppid)
  70. .prologue
  71. .altrp b6
  72. .body
  73. add r17=IA64_TASK_GROUP_LEADER_OFFSET,r16
  74. ;;
  75. ld8 r17=[r17] // r17 = current->group_leader
  76. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  77. ;;
  78. ld4 r9=[r9]
  79. add r17=IA64_TASK_REAL_PARENT_OFFSET,r17 // r17 = &current->group_leader->real_parent
  80. ;;
  81. and r9=TIF_ALLWORK_MASK,r9
  82. 1: ld8 r18=[r17] // r18 = current->group_leader->real_parent
  83. ;;
  84. cmp.ne p8,p0=0,r9
  85. add r8=IA64_TASK_TGID_OFFSET,r18 // r8 = &current->group_leader->real_parent->tgid
  86. ;;
  87. /*
  88. * The .acq is needed to ensure that the read of tgid has returned its data before
  89. * we re-check "real_parent".
  90. */
  91. ld4.acq r8=[r8] // r8 = current->group_leader->real_parent->tgid
  92. #ifdef CONFIG_SMP
  93. /*
  94. * Re-read current->group_leader->real_parent.
  95. */
  96. ld8 r19=[r17] // r19 = current->group_leader->real_parent
  97. (p8) br.spnt.many fsys_fallback_syscall
  98. ;;
  99. cmp.ne p6,p0=r18,r19 // did real_parent change?
  100. mov r19=0 // i must not leak kernel bits...
  101. (p6) br.cond.spnt.few 1b // yes -> redo the read of tgid and the check
  102. ;;
  103. mov r17=0 // i must not leak kernel bits...
  104. mov r18=0 // i must not leak kernel bits...
  105. #else
  106. mov r17=0 // i must not leak kernel bits...
  107. mov r18=0 // i must not leak kernel bits...
  108. mov r19=0 // i must not leak kernel bits...
  109. #endif
  110. FSYS_RETURN
  111. END(fsys_getppid)
  112. ENTRY(fsys_set_tid_address)
  113. .prologue
  114. .altrp b6
  115. .body
  116. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  117. ;;
  118. ld4 r9=[r9]
  119. tnat.z p6,p7=r32 // check argument register for being NaT
  120. ;;
  121. and r9=TIF_ALLWORK_MASK,r9
  122. add r8=IA64_TASK_PID_OFFSET,r16
  123. add r18=IA64_TASK_CLEAR_CHILD_TID_OFFSET,r16
  124. ;;
  125. ld4 r8=[r8]
  126. cmp.ne p8,p0=0,r9
  127. mov r17=-1
  128. ;;
  129. (p6) st8 [r18]=r32
  130. (p7) st8 [r18]=r17
  131. (p8) br.spnt.many fsys_fallback_syscall
  132. ;;
  133. mov r17=0 // i must not leak kernel bits...
  134. mov r18=0 // i must not leak kernel bits...
  135. FSYS_RETURN
  136. END(fsys_set_tid_address)
  137. /*
  138. * Ensure that the time interpolator structure is compatible with the asm code
  139. */
  140. #if IA64_TIME_INTERPOLATOR_SOURCE_OFFSET !=0 || IA64_TIME_INTERPOLATOR_SHIFT_OFFSET != 2 \
  141. || IA64_TIME_INTERPOLATOR_JITTER_OFFSET != 3 || IA64_TIME_INTERPOLATOR_NSEC_OFFSET != 4
  142. #error fsys_gettimeofday incompatible with changes to struct time_interpolator
  143. #endif
  144. #define CLOCK_REALTIME 0
  145. #define CLOCK_MONOTONIC 1
  146. #define CLOCK_DIVIDE_BY_1000 0x4000
  147. #define CLOCK_ADD_MONOTONIC 0x8000
  148. ENTRY(fsys_gettimeofday)
  149. .prologue
  150. .altrp b6
  151. .body
  152. mov r31 = r32
  153. tnat.nz p6,p0 = r33 // guard against NaT argument
  154. (p6) br.cond.spnt.few .fail_einval
  155. mov r30 = CLOCK_DIVIDE_BY_1000
  156. ;;
  157. .gettime:
  158. // Register map
  159. // Incoming r31 = pointer to address where to place result
  160. // r30 = flags determining how time is processed
  161. // r2,r3 = temp r4-r7 preserved
  162. // r8 = result nanoseconds
  163. // r9 = result seconds
  164. // r10 = temporary storage for clock difference
  165. // r11 = preserved: saved ar.pfs
  166. // r12 = preserved: memory stack
  167. // r13 = preserved: thread pointer
  168. // r14 = address of mask / mask
  169. // r15 = preserved: system call number
  170. // r16 = preserved: current task pointer
  171. // r17 = wall to monotonic use
  172. // r18 = time_interpolator->offset
  173. // r19 = address of wall_to_monotonic
  174. // r20 = pointer to struct time_interpolator / pointer to time_interpolator->address
  175. // r21 = shift factor
  176. // r22 = address of time interpolator->last_counter
  177. // r23 = address of time_interpolator->last_cycle
  178. // r24 = adress of time_interpolator->offset
  179. // r25 = last_cycle value
  180. // r26 = last_counter value
  181. // r27 = pointer to xtime
  182. // r28 = sequence number at the beginning of critcal section
  183. // r29 = address of seqlock
  184. // r30 = time processing flags / memory address
  185. // r31 = pointer to result
  186. // Predicates
  187. // p6,p7 short term use
  188. // p8 = timesource ar.itc
  189. // p9 = timesource mmio64
  190. // p10 = timesource mmio32
  191. // p11 = timesource not to be handled by asm code
  192. // p12 = memory time source ( = p9 | p10)
  193. // p13 = do cmpxchg with time_interpolator_last_cycle
  194. // p14 = Divide by 1000
  195. // p15 = Add monotonic
  196. //
  197. // Note that instructions are optimized for McKinley. McKinley can process two
  198. // bundles simultaneously and therefore we continuously try to feed the CPU
  199. // two bundles and then a stop.
  200. tnat.nz p6,p0 = r31 // branch deferred since it does not fit into bundle structure
  201. mov pr = r30,0xc000 // Set predicates according to function
  202. add r2 = TI_FLAGS+IA64_TASK_SIZE,r16
  203. movl r20 = time_interpolator
  204. ;;
  205. ld8 r20 = [r20] // get pointer to time_interpolator structure
  206. movl r29 = xtime_lock
  207. ld4 r2 = [r2] // process work pending flags
  208. movl r27 = xtime
  209. ;; // only one bundle here
  210. ld8 r21 = [r20] // first quad with control information
  211. and r2 = TIF_ALLWORK_MASK,r2
  212. (p6) br.cond.spnt.few .fail_einval // deferred branch
  213. ;;
  214. add r10 = IA64_TIME_INTERPOLATOR_ADDRESS_OFFSET,r20
  215. extr r3 = r21,32,32 // time_interpolator->nsec_per_cyc
  216. extr r8 = r21,0,16 // time_interpolator->source
  217. cmp.ne p6, p0 = 0, r2 // Fallback if work is scheduled
  218. (p6) br.cond.spnt.many fsys_fallback_syscall
  219. ;;
  220. cmp.eq p8,p12 = 0,r8 // Check for cpu timer
  221. cmp.eq p9,p0 = 1,r8 // MMIO64 ?
  222. extr r2 = r21,24,8 // time_interpolator->jitter
  223. cmp.eq p10,p0 = 2,r8 // MMIO32 ?
  224. cmp.ltu p11,p0 = 2,r8 // function or other clock
  225. (p11) br.cond.spnt.many fsys_fallback_syscall
  226. ;;
  227. setf.sig f7 = r3 // Setup for scaling of counter
  228. (p15) movl r19 = wall_to_monotonic
  229. (p12) ld8 r30 = [r10]
  230. cmp.ne p13,p0 = r2,r0 // need jitter compensation?
  231. extr r21 = r21,16,8 // shift factor
  232. ;;
  233. .time_redo:
  234. .pred.rel.mutex p8,p9,p10
  235. ld4.acq r28 = [r29] // xtime_lock.sequence. Must come first for locking purposes
  236. (p8) mov r2 = ar.itc // CPU_TIMER. 36 clocks latency!!!
  237. add r22 = IA64_TIME_INTERPOLATOR_LAST_COUNTER_OFFSET,r20
  238. (p9) ld8 r2 = [r30] // readq(ti->address). Could also have latency issues..
  239. (p10) ld4 r2 = [r30] // readw(ti->address)
  240. (p13) add r23 = IA64_TIME_INTERPOLATOR_LAST_CYCLE_OFFSET,r20
  241. ;; // could be removed by moving the last add upward
  242. ld8 r26 = [r22] // time_interpolator->last_counter
  243. (p13) ld8 r25 = [r23] // time interpolator->last_cycle
  244. add r24 = IA64_TIME_INTERPOLATOR_OFFSET_OFFSET,r20
  245. (p15) ld8 r17 = [r19],IA64_TIMESPEC_TV_NSEC_OFFSET
  246. ld8 r9 = [r27],IA64_TIMESPEC_TV_NSEC_OFFSET
  247. add r14 = IA64_TIME_INTERPOLATOR_MASK_OFFSET, r20
  248. ;;
  249. ld8 r18 = [r24] // time_interpolator->offset
  250. ld8 r8 = [r27],-IA64_TIMESPEC_TV_NSEC_OFFSET // xtime.tv_nsec
  251. (p13) sub r3 = r25,r2 // Diff needed before comparison (thanks davidm)
  252. ;;
  253. ld8 r14 = [r14] // time_interpolator->mask
  254. (p13) cmp.gt.unc p6,p7 = r3,r0 // check if it is less than last. p6,p7 cleared
  255. sub r10 = r2,r26 // current_counter - last_counter
  256. ;;
  257. (p6) sub r10 = r25,r26 // time we got was less than last_cycle
  258. (p7) mov ar.ccv = r25 // more than last_cycle. Prep for cmpxchg
  259. ;;
  260. and r10 = r10,r14 // Apply mask
  261. ;;
  262. setf.sig f8 = r10
  263. nop.i 123
  264. ;;
  265. (p7) cmpxchg8.rel r3 = [r23],r2,ar.ccv
  266. EX(.fail_efault, probe.w.fault r31, 3) // This takes 5 cycles and we have spare time
  267. xmpy.l f8 = f8,f7 // nsec_per_cyc*(counter-last_counter)
  268. (p15) add r9 = r9,r17 // Add wall to monotonic.secs to result secs
  269. ;;
  270. (p15) ld8 r17 = [r19],-IA64_TIMESPEC_TV_NSEC_OFFSET
  271. (p7) cmp.ne p7,p0 = r25,r3 // if cmpxchg not successful redo
  272. // simulate tbit.nz.or p7,p0 = r28,0
  273. and r28 = ~1,r28 // Make sequence even to force retry if odd
  274. getf.sig r2 = f8
  275. mf
  276. add r8 = r8,r18 // Add time interpolator offset
  277. ;;
  278. ld4 r10 = [r29] // xtime_lock.sequence
  279. (p15) add r8 = r8, r17 // Add monotonic.nsecs to nsecs
  280. shr.u r2 = r2,r21
  281. ;; // overloaded 3 bundles!
  282. // End critical section.
  283. add r8 = r8,r2 // Add xtime.nsecs
  284. cmp4.ne.or p7,p0 = r28,r10
  285. (p7) br.cond.dpnt.few .time_redo // sequence number changed ?
  286. // Now r8=tv->tv_nsec and r9=tv->tv_sec
  287. mov r10 = r0
  288. movl r2 = 1000000000
  289. add r23 = IA64_TIMESPEC_TV_NSEC_OFFSET, r31
  290. (p14) movl r3 = 2361183241434822607 // Prep for / 1000 hack
  291. ;;
  292. .time_normalize:
  293. mov r21 = r8
  294. cmp.ge p6,p0 = r8,r2
  295. (p14) shr.u r20 = r8, 3 // We can repeat this if necessary just wasting some time
  296. ;;
  297. (p14) setf.sig f8 = r20
  298. (p6) sub r8 = r8,r2
  299. (p6) add r9 = 1,r9 // two nops before the branch.
  300. (p14) setf.sig f7 = r3 // Chances for repeats are 1 in 10000 for gettod
  301. (p6) br.cond.dpnt.few .time_normalize
  302. ;;
  303. // Divided by 8 though shift. Now divide by 125
  304. // The compiler was able to do that with a multiply
  305. // and a shift and we do the same
  306. EX(.fail_efault, probe.w.fault r23, 3) // This also costs 5 cycles
  307. (p14) xmpy.hu f8 = f8, f7 // xmpy has 5 cycles latency so use it...
  308. ;;
  309. mov r8 = r0
  310. (p14) getf.sig r2 = f8
  311. ;;
  312. (p14) shr.u r21 = r2, 4
  313. ;;
  314. EX(.fail_efault, st8 [r31] = r9)
  315. EX(.fail_efault, st8 [r23] = r21)
  316. FSYS_RETURN
  317. .fail_einval:
  318. mov r8 = EINVAL
  319. mov r10 = -1
  320. FSYS_RETURN
  321. .fail_efault:
  322. mov r8 = EFAULT
  323. mov r10 = -1
  324. FSYS_RETURN
  325. END(fsys_gettimeofday)
  326. ENTRY(fsys_clock_gettime)
  327. .prologue
  328. .altrp b6
  329. .body
  330. cmp4.ltu p6, p0 = CLOCK_MONOTONIC, r32
  331. // Fallback if this is not CLOCK_REALTIME or CLOCK_MONOTONIC
  332. (p6) br.spnt.few fsys_fallback_syscall
  333. mov r31 = r33
  334. shl r30 = r32,15
  335. br.many .gettime
  336. END(fsys_clock_gettime)
  337. /*
  338. * long fsys_rt_sigprocmask (int how, sigset_t *set, sigset_t *oset, size_t sigsetsize).
  339. */
  340. #if _NSIG_WORDS != 1
  341. # error Sorry, fsys_rt_sigprocmask() needs to be updated for _NSIG_WORDS != 1.
  342. #endif
  343. ENTRY(fsys_rt_sigprocmask)
  344. .prologue
  345. .altrp b6
  346. .body
  347. add r2=IA64_TASK_BLOCKED_OFFSET,r16
  348. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  349. cmp4.ltu p6,p0=SIG_SETMASK,r32
  350. cmp.ne p15,p0=r0,r34 // oset != NULL?
  351. tnat.nz p8,p0=r34
  352. add r31=IA64_TASK_SIGHAND_OFFSET,r16
  353. ;;
  354. ld8 r3=[r2] // read/prefetch current->blocked
  355. ld4 r9=[r9]
  356. tnat.nz.or p6,p0=r35
  357. cmp.ne.or p6,p0=_NSIG_WORDS*8,r35
  358. tnat.nz.or p6,p0=r32
  359. (p6) br.spnt.few .fail_einval // fail with EINVAL
  360. ;;
  361. #ifdef CONFIG_SMP
  362. ld8 r31=[r31] // r31 <- current->sighand
  363. #endif
  364. and r9=TIF_ALLWORK_MASK,r9
  365. tnat.nz.or p8,p0=r33
  366. ;;
  367. cmp.ne p7,p0=0,r9
  368. cmp.eq p6,p0=r0,r33 // set == NULL?
  369. add r31=IA64_SIGHAND_SIGLOCK_OFFSET,r31 // r31 <- current->sighand->siglock
  370. (p8) br.spnt.few .fail_efault // fail with EFAULT
  371. (p7) br.spnt.many fsys_fallback_syscall // got pending kernel work...
  372. (p6) br.dpnt.many .store_mask // -> short-circuit to just reading the signal mask
  373. /* Argh, we actually have to do some work and _update_ the signal mask: */
  374. EX(.fail_efault, probe.r.fault r33, 3) // verify user has read-access to *set
  375. EX(.fail_efault, ld8 r14=[r33]) // r14 <- *set
  376. mov r17=(1 << (SIGKILL - 1)) | (1 << (SIGSTOP - 1))
  377. ;;
  378. rsm psr.i // mask interrupt delivery
  379. mov ar.ccv=0
  380. andcm r14=r14,r17 // filter out SIGKILL & SIGSTOP
  381. #ifdef CONFIG_SMP
  382. mov r17=1
  383. ;;
  384. cmpxchg4.acq r18=[r31],r17,ar.ccv // try to acquire the lock
  385. mov r8=EINVAL // default to EINVAL
  386. ;;
  387. ld8 r3=[r2] // re-read current->blocked now that we hold the lock
  388. cmp4.ne p6,p0=r18,r0
  389. (p6) br.cond.spnt.many .lock_contention
  390. ;;
  391. #else
  392. ld8 r3=[r2] // re-read current->blocked now that we hold the lock
  393. mov r8=EINVAL // default to EINVAL
  394. #endif
  395. add r18=IA64_TASK_PENDING_OFFSET+IA64_SIGPENDING_SIGNAL_OFFSET,r16
  396. add r19=IA64_TASK_SIGNAL_OFFSET,r16
  397. cmp4.eq p6,p0=SIG_BLOCK,r32
  398. ;;
  399. ld8 r19=[r19] // r19 <- current->signal
  400. cmp4.eq p7,p0=SIG_UNBLOCK,r32
  401. cmp4.eq p8,p0=SIG_SETMASK,r32
  402. ;;
  403. ld8 r18=[r18] // r18 <- current->pending.signal
  404. .pred.rel.mutex p6,p7,p8
  405. (p6) or r14=r3,r14 // SIG_BLOCK
  406. (p7) andcm r14=r3,r14 // SIG_UNBLOCK
  407. (p8) mov r14=r14 // SIG_SETMASK
  408. (p6) mov r8=0 // clear error code
  409. // recalc_sigpending()
  410. add r17=IA64_SIGNAL_GROUP_STOP_COUNT_OFFSET,r19
  411. add r19=IA64_SIGNAL_SHARED_PENDING_OFFSET+IA64_SIGPENDING_SIGNAL_OFFSET,r19
  412. ;;
  413. ld4 r17=[r17] // r17 <- current->signal->group_stop_count
  414. (p7) mov r8=0 // clear error code
  415. ld8 r19=[r19] // r19 <- current->signal->shared_pending
  416. ;;
  417. cmp4.gt p6,p7=r17,r0 // p6/p7 <- (current->signal->group_stop_count > 0)?
  418. (p8) mov r8=0 // clear error code
  419. or r18=r18,r19 // r18 <- current->pending | current->signal->shared_pending
  420. ;;
  421. // r18 <- (current->pending | current->signal->shared_pending) & ~current->blocked:
  422. andcm r18=r18,r14
  423. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  424. ;;
  425. (p7) cmp.ne.or.andcm p6,p7=r18,r0 // p6/p7 <- signal pending
  426. mov r19=0 // i must not leak kernel bits...
  427. (p6) br.cond.dpnt.many .sig_pending
  428. ;;
  429. 1: ld4 r17=[r9] // r17 <- current->thread_info->flags
  430. ;;
  431. mov ar.ccv=r17
  432. and r18=~_TIF_SIGPENDING,r17 // r18 <- r17 & ~(1 << TIF_SIGPENDING)
  433. ;;
  434. st8 [r2]=r14 // update current->blocked with new mask
  435. cmpxchg4.acq r14=[r9],r18,ar.ccv // current->thread_info->flags <- r18
  436. ;;
  437. cmp.ne p6,p0=r17,r14 // update failed?
  438. (p6) br.cond.spnt.few 1b // yes -> retry
  439. #ifdef CONFIG_SMP
  440. st4.rel [r31]=r0 // release the lock
  441. #endif
  442. ssm psr.i
  443. ;;
  444. srlz.d // ensure psr.i is set again
  445. mov r18=0 // i must not leak kernel bits...
  446. .store_mask:
  447. EX(.fail_efault, (p15) probe.w.fault r34, 3) // verify user has write-access to *oset
  448. EX(.fail_efault, (p15) st8 [r34]=r3)
  449. mov r2=0 // i must not leak kernel bits...
  450. mov r3=0 // i must not leak kernel bits...
  451. mov r8=0 // return 0
  452. mov r9=0 // i must not leak kernel bits...
  453. mov r14=0 // i must not leak kernel bits...
  454. mov r17=0 // i must not leak kernel bits...
  455. mov r31=0 // i must not leak kernel bits...
  456. FSYS_RETURN
  457. .sig_pending:
  458. #ifdef CONFIG_SMP
  459. st4.rel [r31]=r0 // release the lock
  460. #endif
  461. ssm psr.i
  462. ;;
  463. srlz.d
  464. br.sptk.many fsys_fallback_syscall // with signal pending, do the heavy-weight syscall
  465. #ifdef CONFIG_SMP
  466. .lock_contention:
  467. /* Rather than spinning here, fall back on doing a heavy-weight syscall. */
  468. ssm psr.i
  469. ;;
  470. srlz.d
  471. br.sptk.many fsys_fallback_syscall
  472. #endif
  473. END(fsys_rt_sigprocmask)
  474. ENTRY(fsys_fallback_syscall)
  475. .prologue
  476. .altrp b6
  477. .body
  478. /*
  479. * We only get here from light-weight syscall handlers. Thus, we already
  480. * know that r15 contains a valid syscall number. No need to re-check.
  481. */
  482. adds r17=-1024,r15
  483. movl r14=sys_call_table
  484. ;;
  485. rsm psr.i
  486. shladd r18=r17,3,r14
  487. ;;
  488. ld8 r18=[r18] // load normal (heavy-weight) syscall entry-point
  489. mov r29=psr // read psr (12 cyc load latency)
  490. mov r27=ar.rsc
  491. mov r21=ar.fpsr
  492. mov r26=ar.pfs
  493. END(fsys_fallback_syscall)
  494. /* FALL THROUGH */
  495. GLOBAL_ENTRY(fsys_bubble_down)
  496. .prologue
  497. .altrp b6
  498. .body
  499. /*
  500. * We get here for syscalls that don't have a lightweight handler. For those, we
  501. * need to bubble down into the kernel and that requires setting up a minimal
  502. * pt_regs structure, and initializing the CPU state more or less as if an
  503. * interruption had occurred. To make syscall-restarts work, we setup pt_regs
  504. * such that cr_iip points to the second instruction in syscall_via_break.
  505. * Decrementing the IP hence will restart the syscall via break and not
  506. * decrementing IP will return us to the caller, as usual. Note that we preserve
  507. * the value of psr.pp rather than initializing it from dcr.pp. This makes it
  508. * possible to distinguish fsyscall execution from other privileged execution.
  509. *
  510. * On entry:
  511. * - normal fsyscall handler register usage, except that we also have:
  512. * - r18: address of syscall entry point
  513. * - r21: ar.fpsr
  514. * - r26: ar.pfs
  515. * - r27: ar.rsc
  516. * - r29: psr
  517. */
  518. # define PSR_PRESERVED_BITS (IA64_PSR_UP | IA64_PSR_MFL | IA64_PSR_MFH | IA64_PSR_PK \
  519. | IA64_PSR_DT | IA64_PSR_PP | IA64_PSR_SP | IA64_PSR_RT \
  520. | IA64_PSR_IC)
  521. /*
  522. * Reading psr.l gives us only bits 0-31, psr.it, and psr.mc. The rest we have
  523. * to synthesize.
  524. */
  525. # define PSR_ONE_BITS ((3 << IA64_PSR_CPL0_BIT) | (0x1 << IA64_PSR_RI_BIT) \
  526. | IA64_PSR_BN | IA64_PSR_I)
  527. invala
  528. movl r8=PSR_ONE_BITS
  529. mov r25=ar.unat // save ar.unat (5 cyc)
  530. movl r9=PSR_PRESERVED_BITS
  531. mov ar.rsc=0 // set enforced lazy mode, pl 0, little-endian, loadrs=0
  532. movl r28=__kernel_syscall_via_break
  533. ;;
  534. mov r23=ar.bspstore // save ar.bspstore (12 cyc)
  535. mov r31=pr // save pr (2 cyc)
  536. mov r20=r1 // save caller's gp in r20
  537. ;;
  538. mov r2=r16 // copy current task addr to addl-addressable register
  539. and r9=r9,r29
  540. mov r19=b6 // save b6 (2 cyc)
  541. ;;
  542. mov psr.l=r9 // slam the door (17 cyc to srlz.i)
  543. or r29=r8,r29 // construct cr.ipsr value to save
  544. addl r22=IA64_RBS_OFFSET,r2 // compute base of RBS
  545. ;;
  546. // GAS reports a spurious RAW hazard on the read of ar.rnat because it thinks
  547. // we may be reading ar.itc after writing to psr.l. Avoid that message with
  548. // this directive:
  549. dv_serialize_data
  550. mov.m r24=ar.rnat // read ar.rnat (5 cyc lat)
  551. lfetch.fault.excl.nt1 [r22]
  552. adds r16=IA64_TASK_THREAD_ON_USTACK_OFFSET,r2
  553. // ensure previous insn group is issued before we stall for srlz.i:
  554. ;;
  555. srlz.i // ensure new psr.l has been established
  556. /////////////////////////////////////////////////////////////////////////////
  557. ////////// from this point on, execution is not interruptible anymore
  558. /////////////////////////////////////////////////////////////////////////////
  559. addl r1=IA64_STK_OFFSET-IA64_PT_REGS_SIZE,r2 // compute base of memory stack
  560. cmp.ne pKStk,pUStk=r0,r0 // set pKStk <- 0, pUStk <- 1
  561. ;;
  562. st1 [r16]=r0 // clear current->thread.on_ustack flag
  563. mov ar.bspstore=r22 // switch to kernel RBS
  564. mov b6=r18 // copy syscall entry-point to b6 (7 cyc)
  565. add r3=TI_FLAGS+IA64_TASK_SIZE,r2
  566. ;;
  567. ld4 r3=[r3] // r2 = current_thread_info()->flags
  568. mov r18=ar.bsp // save (kernel) ar.bsp (12 cyc)
  569. mov ar.rsc=0x3 // set eager mode, pl 0, little-endian, loadrs=0
  570. br.call.sptk.many b7=ia64_syscall_setup
  571. ;;
  572. ssm psr.i
  573. movl r2=ia64_ret_from_syscall
  574. ;;
  575. mov rp=r2 // set the real return addr
  576. tbit.z p8,p0=r3,TIF_SYSCALL_TRACE
  577. ;;
  578. (p10) br.cond.spnt.many ia64_ret_from_syscall // p10==true means out registers are more than 8
  579. (p8) br.call.sptk.many b6=b6 // ignore this return addr
  580. br.cond.sptk ia64_trace_syscall
  581. END(fsys_bubble_down)
  582. .rodata
  583. .align 8
  584. .globl fsyscall_table
  585. data8 fsys_bubble_down
  586. fsyscall_table:
  587. data8 fsys_ni_syscall
  588. data8 0 // exit // 1025
  589. data8 0 // read
  590. data8 0 // write
  591. data8 0 // open
  592. data8 0 // close
  593. data8 0 // creat // 1030
  594. data8 0 // link
  595. data8 0 // unlink
  596. data8 0 // execve
  597. data8 0 // chdir
  598. data8 0 // fchdir // 1035
  599. data8 0 // utimes
  600. data8 0 // mknod
  601. data8 0 // chmod
  602. data8 0 // chown
  603. data8 0 // lseek // 1040
  604. data8 fsys_getpid // getpid
  605. data8 fsys_getppid // getppid
  606. data8 0 // mount
  607. data8 0 // umount
  608. data8 0 // setuid // 1045
  609. data8 0 // getuid
  610. data8 0 // geteuid
  611. data8 0 // ptrace
  612. data8 0 // access
  613. data8 0 // sync // 1050
  614. data8 0 // fsync
  615. data8 0 // fdatasync
  616. data8 0 // kill
  617. data8 0 // rename
  618. data8 0 // mkdir // 1055
  619. data8 0 // rmdir
  620. data8 0 // dup
  621. data8 0 // pipe
  622. data8 0 // times
  623. data8 0 // brk // 1060
  624. data8 0 // setgid
  625. data8 0 // getgid
  626. data8 0 // getegid
  627. data8 0 // acct
  628. data8 0 // ioctl // 1065
  629. data8 0 // fcntl
  630. data8 0 // umask
  631. data8 0 // chroot
  632. data8 0 // ustat
  633. data8 0 // dup2 // 1070
  634. data8 0 // setreuid
  635. data8 0 // setregid
  636. data8 0 // getresuid
  637. data8 0 // setresuid
  638. data8 0 // getresgid // 1075
  639. data8 0 // setresgid
  640. data8 0 // getgroups
  641. data8 0 // setgroups
  642. data8 0 // getpgid
  643. data8 0 // setpgid // 1080
  644. data8 0 // setsid
  645. data8 0 // getsid
  646. data8 0 // sethostname
  647. data8 0 // setrlimit
  648. data8 0 // getrlimit // 1085
  649. data8 0 // getrusage
  650. data8 fsys_gettimeofday // gettimeofday
  651. data8 0 // settimeofday
  652. data8 0 // select
  653. data8 0 // poll // 1090
  654. data8 0 // symlink
  655. data8 0 // readlink
  656. data8 0 // uselib
  657. data8 0 // swapon
  658. data8 0 // swapoff // 1095
  659. data8 0 // reboot
  660. data8 0 // truncate
  661. data8 0 // ftruncate
  662. data8 0 // fchmod
  663. data8 0 // fchown // 1100
  664. data8 0 // getpriority
  665. data8 0 // setpriority
  666. data8 0 // statfs
  667. data8 0 // fstatfs
  668. data8 0 // gettid // 1105
  669. data8 0 // semget
  670. data8 0 // semop
  671. data8 0 // semctl
  672. data8 0 // msgget
  673. data8 0 // msgsnd // 1110
  674. data8 0 // msgrcv
  675. data8 0 // msgctl
  676. data8 0 // shmget
  677. data8 0 // shmat
  678. data8 0 // shmdt // 1115
  679. data8 0 // shmctl
  680. data8 0 // syslog
  681. data8 0 // setitimer
  682. data8 0 // getitimer
  683. data8 0 // 1120
  684. data8 0
  685. data8 0
  686. data8 0 // vhangup
  687. data8 0 // lchown
  688. data8 0 // remap_file_pages // 1125
  689. data8 0 // wait4
  690. data8 0 // sysinfo
  691. data8 0 // clone
  692. data8 0 // setdomainname
  693. data8 0 // newuname // 1130
  694. data8 0 // adjtimex
  695. data8 0
  696. data8 0 // init_module
  697. data8 0 // delete_module
  698. data8 0 // 1135
  699. data8 0
  700. data8 0 // quotactl
  701. data8 0 // bdflush
  702. data8 0 // sysfs
  703. data8 0 // personality // 1140
  704. data8 0 // afs_syscall
  705. data8 0 // setfsuid
  706. data8 0 // setfsgid
  707. data8 0 // getdents
  708. data8 0 // flock // 1145
  709. data8 0 // readv
  710. data8 0 // writev
  711. data8 0 // pread64
  712. data8 0 // pwrite64
  713. data8 0 // sysctl // 1150
  714. data8 0 // mmap
  715. data8 0 // munmap
  716. data8 0 // mlock
  717. data8 0 // mlockall
  718. data8 0 // mprotect // 1155
  719. data8 0 // mremap
  720. data8 0 // msync
  721. data8 0 // munlock
  722. data8 0 // munlockall
  723. data8 0 // sched_getparam // 1160
  724. data8 0 // sched_setparam
  725. data8 0 // sched_getscheduler
  726. data8 0 // sched_setscheduler
  727. data8 0 // sched_yield
  728. data8 0 // sched_get_priority_max // 1165
  729. data8 0 // sched_get_priority_min
  730. data8 0 // sched_rr_get_interval
  731. data8 0 // nanosleep
  732. data8 0 // nfsservctl
  733. data8 0 // prctl // 1170
  734. data8 0 // getpagesize
  735. data8 0 // mmap2
  736. data8 0 // pciconfig_read
  737. data8 0 // pciconfig_write
  738. data8 0 // perfmonctl // 1175
  739. data8 0 // sigaltstack
  740. data8 0 // rt_sigaction
  741. data8 0 // rt_sigpending
  742. data8 fsys_rt_sigprocmask // rt_sigprocmask
  743. data8 0 // rt_sigqueueinfo // 1180
  744. data8 0 // rt_sigreturn
  745. data8 0 // rt_sigsuspend
  746. data8 0 // rt_sigtimedwait
  747. data8 0 // getcwd
  748. data8 0 // capget // 1185
  749. data8 0 // capset
  750. data8 0 // sendfile
  751. data8 0
  752. data8 0
  753. data8 0 // socket // 1190
  754. data8 0 // bind
  755. data8 0 // connect
  756. data8 0 // listen
  757. data8 0 // accept
  758. data8 0 // getsockname // 1195
  759. data8 0 // getpeername
  760. data8 0 // socketpair
  761. data8 0 // send
  762. data8 0 // sendto
  763. data8 0 // recv // 1200
  764. data8 0 // recvfrom
  765. data8 0 // shutdown
  766. data8 0 // setsockopt
  767. data8 0 // getsockopt
  768. data8 0 // sendmsg // 1205
  769. data8 0 // recvmsg
  770. data8 0 // pivot_root
  771. data8 0 // mincore
  772. data8 0 // madvise
  773. data8 0 // newstat // 1210
  774. data8 0 // newlstat
  775. data8 0 // newfstat
  776. data8 0 // clone2
  777. data8 0 // getdents64
  778. data8 0 // getunwind // 1215
  779. data8 0 // readahead
  780. data8 0 // setxattr
  781. data8 0 // lsetxattr
  782. data8 0 // fsetxattr
  783. data8 0 // getxattr // 1220
  784. data8 0 // lgetxattr
  785. data8 0 // fgetxattr
  786. data8 0 // listxattr
  787. data8 0 // llistxattr
  788. data8 0 // flistxattr // 1225
  789. data8 0 // removexattr
  790. data8 0 // lremovexattr
  791. data8 0 // fremovexattr
  792. data8 0 // tkill
  793. data8 0 // futex // 1230
  794. data8 0 // sched_setaffinity
  795. data8 0 // sched_getaffinity
  796. data8 fsys_set_tid_address // set_tid_address
  797. data8 0 // fadvise64_64
  798. data8 0 // tgkill // 1235
  799. data8 0 // exit_group
  800. data8 0 // lookup_dcookie
  801. data8 0 // io_setup
  802. data8 0 // io_destroy
  803. data8 0 // io_getevents // 1240
  804. data8 0 // io_submit
  805. data8 0 // io_cancel
  806. data8 0 // epoll_create
  807. data8 0 // epoll_ctl
  808. data8 0 // epoll_wait // 1245
  809. data8 0 // restart_syscall
  810. data8 0 // semtimedop
  811. data8 0 // timer_create
  812. data8 0 // timer_settime
  813. data8 0 // timer_gettime // 1250
  814. data8 0 // timer_getoverrun
  815. data8 0 // timer_delete
  816. data8 0 // clock_settime
  817. data8 fsys_clock_gettime // clock_gettime
  818. data8 0 // clock_getres // 1255
  819. data8 0 // clock_nanosleep
  820. data8 0 // fstatfs64
  821. data8 0 // statfs64
  822. data8 0
  823. data8 0 // 1260
  824. data8 0
  825. data8 0 // mq_open
  826. data8 0 // mq_unlink
  827. data8 0 // mq_timedsend
  828. data8 0 // mq_timedreceive // 1265
  829. data8 0 // mq_notify
  830. data8 0 // mq_getsetattr
  831. data8 0 // kexec_load
  832. data8 0
  833. data8 0 // 1270
  834. data8 0
  835. data8 0
  836. data8 0
  837. data8 0
  838. data8 0 // 1275
  839. data8 0
  840. data8 0
  841. data8 0
  842. data8 0
  843. .org fsyscall_table + 8*NR_syscalls // guard against failures to increase NR_syscalls