fsys.S 28 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988
  1. /*
  2. * This file contains the light-weight system call handlers (fsyscall-handlers).
  3. *
  4. * Copyright (C) 2003 Hewlett-Packard Co
  5. * David Mosberger-Tang <davidm@hpl.hp.com>
  6. *
  7. * 25-Sep-03 davidm Implement fsys_rt_sigprocmask().
  8. * 18-Feb-03 louisk Implement fsys_gettimeofday().
  9. * 28-Feb-03 davidm Fixed several bugs in fsys_gettimeofday(). Tuned it some more,
  10. * probably broke it along the way... ;-)
  11. * 13-Jul-04 clameter Implement fsys_clock_gettime and revise fsys_gettimeofday to make
  12. * it capable of using memory based clocks without falling back to C code.
  13. * 08-Feb-07 Fenghua Yu Implement fsys_getcpu.
  14. *
  15. */
  16. #include <asm/asmmacro.h>
  17. #include <asm/errno.h>
  18. #include <asm/asm-offsets.h>
  19. #include <asm/percpu.h>
  20. #include <asm/thread_info.h>
  21. #include <asm/sal.h>
  22. #include <asm/signal.h>
  23. #include <asm/system.h>
  24. #include <asm/unistd.h>
  25. #include "entry.h"
  26. /*
  27. * See Documentation/ia64/fsys.txt for details on fsyscalls.
  28. *
  29. * On entry to an fsyscall handler:
  30. * r10 = 0 (i.e., defaults to "successful syscall return")
  31. * r11 = saved ar.pfs (a user-level value)
  32. * r15 = system call number
  33. * r16 = "current" task pointer (in normal kernel-mode, this is in r13)
  34. * r32-r39 = system call arguments
  35. * b6 = return address (a user-level value)
  36. * ar.pfs = previous frame-state (a user-level value)
  37. * PSR.be = cleared to zero (i.e., little-endian byte order is in effect)
  38. * all other registers may contain values passed in from user-mode
  39. *
  40. * On return from an fsyscall handler:
  41. * r11 = saved ar.pfs (as passed into the fsyscall handler)
  42. * r15 = system call number (as passed into the fsyscall handler)
  43. * r32-r39 = system call arguments (as passed into the fsyscall handler)
  44. * b6 = return address (as passed into the fsyscall handler)
  45. * ar.pfs = previous frame-state (as passed into the fsyscall handler)
  46. */
  47. ENTRY(fsys_ni_syscall)
  48. .prologue
  49. .altrp b6
  50. .body
  51. mov r8=ENOSYS
  52. mov r10=-1
  53. FSYS_RETURN
  54. END(fsys_ni_syscall)
  55. ENTRY(fsys_getpid)
  56. .prologue
  57. .altrp b6
  58. .body
  59. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  60. ;;
  61. ld4 r9=[r9]
  62. add r8=IA64_TASK_TGID_OFFSET,r16
  63. ;;
  64. and r9=TIF_ALLWORK_MASK,r9
  65. ld4 r8=[r8] // r8 = current->tgid
  66. ;;
  67. cmp.ne p8,p0=0,r9
  68. (p8) br.spnt.many fsys_fallback_syscall
  69. FSYS_RETURN
  70. END(fsys_getpid)
  71. ENTRY(fsys_getppid)
  72. .prologue
  73. .altrp b6
  74. .body
  75. add r17=IA64_TASK_GROUP_LEADER_OFFSET,r16
  76. ;;
  77. ld8 r17=[r17] // r17 = current->group_leader
  78. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  79. ;;
  80. ld4 r9=[r9]
  81. add r17=IA64_TASK_REAL_PARENT_OFFSET,r17 // r17 = &current->group_leader->real_parent
  82. ;;
  83. and r9=TIF_ALLWORK_MASK,r9
  84. 1: ld8 r18=[r17] // r18 = current->group_leader->real_parent
  85. ;;
  86. cmp.ne p8,p0=0,r9
  87. add r8=IA64_TASK_TGID_OFFSET,r18 // r8 = &current->group_leader->real_parent->tgid
  88. ;;
  89. /*
  90. * The .acq is needed to ensure that the read of tgid has returned its data before
  91. * we re-check "real_parent".
  92. */
  93. ld4.acq r8=[r8] // r8 = current->group_leader->real_parent->tgid
  94. #ifdef CONFIG_SMP
  95. /*
  96. * Re-read current->group_leader->real_parent.
  97. */
  98. ld8 r19=[r17] // r19 = current->group_leader->real_parent
  99. (p8) br.spnt.many fsys_fallback_syscall
  100. ;;
  101. cmp.ne p6,p0=r18,r19 // did real_parent change?
  102. mov r19=0 // i must not leak kernel bits...
  103. (p6) br.cond.spnt.few 1b // yes -> redo the read of tgid and the check
  104. ;;
  105. mov r17=0 // i must not leak kernel bits...
  106. mov r18=0 // i must not leak kernel bits...
  107. #else
  108. mov r17=0 // i must not leak kernel bits...
  109. mov r18=0 // i must not leak kernel bits...
  110. mov r19=0 // i must not leak kernel bits...
  111. #endif
  112. FSYS_RETURN
  113. END(fsys_getppid)
  114. ENTRY(fsys_set_tid_address)
  115. .prologue
  116. .altrp b6
  117. .body
  118. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  119. ;;
  120. ld4 r9=[r9]
  121. tnat.z p6,p7=r32 // check argument register for being NaT
  122. ;;
  123. and r9=TIF_ALLWORK_MASK,r9
  124. add r8=IA64_TASK_PID_OFFSET,r16
  125. add r18=IA64_TASK_CLEAR_CHILD_TID_OFFSET,r16
  126. ;;
  127. ld4 r8=[r8]
  128. cmp.ne p8,p0=0,r9
  129. mov r17=-1
  130. ;;
  131. (p6) st8 [r18]=r32
  132. (p7) st8 [r18]=r17
  133. (p8) br.spnt.many fsys_fallback_syscall
  134. ;;
  135. mov r17=0 // i must not leak kernel bits...
  136. mov r18=0 // i must not leak kernel bits...
  137. FSYS_RETURN
  138. END(fsys_set_tid_address)
  139. #if IA64_GTOD_LOCK_OFFSET !=0
  140. #error fsys_gettimeofday incompatible with changes to struct fsyscall_gtod_data_t
  141. #endif
  142. #if IA64_ITC_JITTER_OFFSET !=0
  143. #error fsys_gettimeofday incompatible with changes to struct itc_jitter_data_t
  144. #endif
  145. #define CLOCK_REALTIME 0
  146. #define CLOCK_MONOTONIC 1
  147. #define CLOCK_DIVIDE_BY_1000 0x4000
  148. #define CLOCK_ADD_MONOTONIC 0x8000
  149. ENTRY(fsys_gettimeofday)
  150. .prologue
  151. .altrp b6
  152. .body
  153. mov r31 = r32
  154. tnat.nz p6,p0 = r33 // guard against NaT argument
  155. (p6) br.cond.spnt.few .fail_einval
  156. mov r30 = CLOCK_DIVIDE_BY_1000
  157. ;;
  158. .gettime:
  159. // Register map
  160. // Incoming r31 = pointer to address where to place result
  161. // r30 = flags determining how time is processed
  162. // r2,r3 = temp r4-r7 preserved
  163. // r8 = result nanoseconds
  164. // r9 = result seconds
  165. // r10 = temporary storage for clock difference
  166. // r11 = preserved: saved ar.pfs
  167. // r12 = preserved: memory stack
  168. // r13 = preserved: thread pointer
  169. // r14 = address of mask / mask value
  170. // r15 = preserved: system call number
  171. // r16 = preserved: current task pointer
  172. // r17 = (not used)
  173. // r18 = (not used)
  174. // r19 = address of itc_lastcycle
  175. // r20 = struct fsyscall_gtod_data (= address of gtod_lock.sequence)
  176. // r21 = address of mmio_ptr
  177. // r22 = address of wall_time or monotonic_time
  178. // r23 = address of shift / value
  179. // r24 = address mult factor / cycle_last value
  180. // r25 = itc_lastcycle value
  181. // r26 = address clocksource cycle_last
  182. // r27 = (not used)
  183. // r28 = sequence number at the beginning of critcal section
  184. // r29 = address of itc_jitter
  185. // r30 = time processing flags / memory address
  186. // r31 = pointer to result
  187. // Predicates
  188. // p6,p7 short term use
  189. // p8 = timesource ar.itc
  190. // p9 = timesource mmio64
  191. // p10 = timesource mmio32 - not used
  192. // p11 = timesource not to be handled by asm code
  193. // p12 = memory time source ( = p9 | p10) - not used
  194. // p13 = do cmpxchg with itc_lastcycle
  195. // p14 = Divide by 1000
  196. // p15 = Add monotonic
  197. //
  198. // Note that instructions are optimized for McKinley. McKinley can
  199. // process two bundles simultaneously and therefore we continuously
  200. // try to feed the CPU two bundles and then a stop.
  201. //
  202. // Additional note that code has changed a lot. Optimization is TBD.
  203. // Comments begin with "?" are maybe outdated.
  204. tnat.nz p6,p0 = r31 // ? branch deferred to fit later bundle
  205. mov pr = r30,0xc000 // Set predicates according to function
  206. add r2 = TI_FLAGS+IA64_TASK_SIZE,r16
  207. movl r20 = fsyscall_gtod_data // load fsyscall gettimeofday data address
  208. ;;
  209. movl r29 = itc_jitter_data // itc_jitter
  210. add r22 = IA64_GTOD_WALL_TIME_OFFSET,r20 // wall_time
  211. ld4 r2 = [r2] // process work pending flags
  212. ;;
  213. (p15) add r22 = IA64_GTOD_MONO_TIME_OFFSET,r20 // monotonic_time
  214. add r21 = IA64_CLKSRC_MMIO_OFFSET,r20
  215. add r19 = IA64_ITC_LASTCYCLE_OFFSET,r29
  216. and r2 = TIF_ALLWORK_MASK,r2
  217. (p6) br.cond.spnt.few .fail_einval // ? deferred branch
  218. ;;
  219. add r26 = IA64_CLKSRC_CYCLE_LAST_OFFSET,r20 // clksrc_cycle_last
  220. cmp.ne p6, p0 = 0, r2 // Fallback if work is scheduled
  221. (p6) br.cond.spnt.many fsys_fallback_syscall
  222. ;;
  223. // Begin critical section
  224. .time_redo:
  225. ld4.acq r28 = [r20] // gtod_lock.sequence, Must take first
  226. ;;
  227. and r28 = ~1,r28 // And make sequence even to force retry if odd
  228. ;;
  229. ld8 r30 = [r21] // clocksource->mmio_ptr
  230. add r24 = IA64_CLKSRC_MULT_OFFSET,r20
  231. ld4 r2 = [r29] // itc_jitter value
  232. add r23 = IA64_CLKSRC_SHIFT_OFFSET,r20
  233. add r14 = IA64_CLKSRC_MASK_OFFSET,r20
  234. ;;
  235. ld4 r3 = [r24] // clocksource mult value
  236. ld8 r14 = [r14] // clocksource mask value
  237. cmp.eq p8,p9 = 0,r30 // use cpu timer if no mmio_ptr
  238. ;;
  239. setf.sig f7 = r3 // Setup for mult scaling of counter
  240. (p8) cmp.ne p13,p0 = r2,r0 // need itc_jitter compensation, set p13
  241. ld4 r23 = [r23] // clocksource shift value
  242. ld8 r24 = [r26] // get clksrc_cycle_last value
  243. (p9) cmp.eq p13,p0 = 0,r30 // if mmio_ptr, clear p13 jitter control
  244. ;;
  245. .pred.rel.mutex p8,p9
  246. (p8) mov r2 = ar.itc // CPU_TIMER. 36 clocks latency!!!
  247. (p9) ld8 r2 = [r30] // MMIO_TIMER. Could also have latency issues..
  248. (p13) ld8 r25 = [r19] // get itc_lastcycle value
  249. ;; // ? could be removed by moving the last add upward
  250. ld8 r9 = [r22],IA64_TIMESPEC_TV_NSEC_OFFSET // tv_sec
  251. ;;
  252. ld8 r8 = [r22],-IA64_TIMESPEC_TV_NSEC_OFFSET // tv_nsec
  253. (p13) sub r3 = r25,r2 // Diff needed before comparison (thanks davidm)
  254. ;;
  255. (p13) cmp.gt.unc p6,p7 = r3,r0 // check if it is less than last. p6,p7 cleared
  256. sub r10 = r2,r24 // current_cycle - last_cycle
  257. ;;
  258. (p6) sub r10 = r25,r24 // time we got was less than last_cycle
  259. (p7) mov ar.ccv = r25 // more than last_cycle. Prep for cmpxchg
  260. ;;
  261. (p7) cmpxchg8.rel r3 = [r19],r2,ar.ccv
  262. ;;
  263. (p7) cmp.ne p7,p0 = r25,r3 // if cmpxchg not successful
  264. ;;
  265. (p7) sub r10 = r3,r24 // then use new last_cycle instead
  266. ;;
  267. and r10 = r10,r14 // Apply mask
  268. ;;
  269. setf.sig f8 = r10
  270. nop.i 123
  271. ;;
  272. // fault check takes 5 cycles and we have spare time
  273. EX(.fail_efault, probe.w.fault r31, 3)
  274. xmpy.l f8 = f8,f7 // nsec_per_cyc*(counter-last_counter)
  275. ;;
  276. // ? simulate tbit.nz.or p7,p0 = r28,0
  277. getf.sig r2 = f8
  278. mf
  279. ;;
  280. ld4 r10 = [r20] // gtod_lock.sequence
  281. shr.u r2 = r2,r23 // shift by factor
  282. ;; // ? overloaded 3 bundles!
  283. add r8 = r8,r2 // Add xtime.nsecs
  284. cmp4.ne p7,p0 = r28,r10
  285. (p7) br.cond.dpnt.few .time_redo // sequence number changed, redo
  286. // End critical section.
  287. // Now r8=tv->tv_nsec and r9=tv->tv_sec
  288. mov r10 = r0
  289. movl r2 = 1000000000
  290. add r23 = IA64_TIMESPEC_TV_NSEC_OFFSET, r31
  291. (p14) movl r3 = 2361183241434822607 // Prep for / 1000 hack
  292. ;;
  293. .time_normalize:
  294. mov r21 = r8
  295. cmp.ge p6,p0 = r8,r2
  296. (p14) shr.u r20 = r8, 3 // We can repeat this if necessary just wasting time
  297. ;;
  298. (p14) setf.sig f8 = r20
  299. (p6) sub r8 = r8,r2
  300. (p6) add r9 = 1,r9 // two nops before the branch.
  301. (p14) setf.sig f7 = r3 // Chances for repeats are 1 in 10000 for gettod
  302. (p6) br.cond.dpnt.few .time_normalize
  303. ;;
  304. // Divided by 8 though shift. Now divide by 125
  305. // The compiler was able to do that with a multiply
  306. // and a shift and we do the same
  307. EX(.fail_efault, probe.w.fault r23, 3) // This also costs 5 cycles
  308. (p14) xmpy.hu f8 = f8, f7 // xmpy has 5 cycles latency so use it
  309. ;;
  310. mov r8 = r0
  311. (p14) getf.sig r2 = f8
  312. ;;
  313. (p14) shr.u r21 = r2, 4
  314. ;;
  315. EX(.fail_efault, st8 [r31] = r9)
  316. EX(.fail_efault, st8 [r23] = r21)
  317. FSYS_RETURN
  318. .fail_einval:
  319. mov r8 = EINVAL
  320. mov r10 = -1
  321. FSYS_RETURN
  322. .fail_efault:
  323. mov r8 = EFAULT
  324. mov r10 = -1
  325. FSYS_RETURN
  326. END(fsys_gettimeofday)
  327. ENTRY(fsys_clock_gettime)
  328. .prologue
  329. .altrp b6
  330. .body
  331. cmp4.ltu p6, p0 = CLOCK_MONOTONIC, r32
  332. // Fallback if this is not CLOCK_REALTIME or CLOCK_MONOTONIC
  333. (p6) br.spnt.few fsys_fallback_syscall
  334. mov r31 = r33
  335. shl r30 = r32,15
  336. br.many .gettime
  337. END(fsys_clock_gettime)
  338. /*
  339. * long fsys_rt_sigprocmask (int how, sigset_t *set, sigset_t *oset, size_t sigsetsize).
  340. */
  341. #if _NSIG_WORDS != 1
  342. # error Sorry, fsys_rt_sigprocmask() needs to be updated for _NSIG_WORDS != 1.
  343. #endif
  344. ENTRY(fsys_rt_sigprocmask)
  345. .prologue
  346. .altrp b6
  347. .body
  348. add r2=IA64_TASK_BLOCKED_OFFSET,r16
  349. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  350. cmp4.ltu p6,p0=SIG_SETMASK,r32
  351. cmp.ne p15,p0=r0,r34 // oset != NULL?
  352. tnat.nz p8,p0=r34
  353. add r31=IA64_TASK_SIGHAND_OFFSET,r16
  354. ;;
  355. ld8 r3=[r2] // read/prefetch current->blocked
  356. ld4 r9=[r9]
  357. tnat.nz.or p6,p0=r35
  358. cmp.ne.or p6,p0=_NSIG_WORDS*8,r35
  359. tnat.nz.or p6,p0=r32
  360. (p6) br.spnt.few .fail_einval // fail with EINVAL
  361. ;;
  362. #ifdef CONFIG_SMP
  363. ld8 r31=[r31] // r31 <- current->sighand
  364. #endif
  365. and r9=TIF_ALLWORK_MASK,r9
  366. tnat.nz.or p8,p0=r33
  367. ;;
  368. cmp.ne p7,p0=0,r9
  369. cmp.eq p6,p0=r0,r33 // set == NULL?
  370. add r31=IA64_SIGHAND_SIGLOCK_OFFSET,r31 // r31 <- current->sighand->siglock
  371. (p8) br.spnt.few .fail_efault // fail with EFAULT
  372. (p7) br.spnt.many fsys_fallback_syscall // got pending kernel work...
  373. (p6) br.dpnt.many .store_mask // -> short-circuit to just reading the signal mask
  374. /* Argh, we actually have to do some work and _update_ the signal mask: */
  375. EX(.fail_efault, probe.r.fault r33, 3) // verify user has read-access to *set
  376. EX(.fail_efault, ld8 r14=[r33]) // r14 <- *set
  377. mov r17=(1 << (SIGKILL - 1)) | (1 << (SIGSTOP - 1))
  378. ;;
  379. rsm psr.i // mask interrupt delivery
  380. mov ar.ccv=0
  381. andcm r14=r14,r17 // filter out SIGKILL & SIGSTOP
  382. #ifdef CONFIG_SMP
  383. mov r17=1
  384. ;;
  385. cmpxchg4.acq r18=[r31],r17,ar.ccv // try to acquire the lock
  386. mov r8=EINVAL // default to EINVAL
  387. ;;
  388. ld8 r3=[r2] // re-read current->blocked now that we hold the lock
  389. cmp4.ne p6,p0=r18,r0
  390. (p6) br.cond.spnt.many .lock_contention
  391. ;;
  392. #else
  393. ld8 r3=[r2] // re-read current->blocked now that we hold the lock
  394. mov r8=EINVAL // default to EINVAL
  395. #endif
  396. add r18=IA64_TASK_PENDING_OFFSET+IA64_SIGPENDING_SIGNAL_OFFSET,r16
  397. add r19=IA64_TASK_SIGNAL_OFFSET,r16
  398. cmp4.eq p6,p0=SIG_BLOCK,r32
  399. ;;
  400. ld8 r19=[r19] // r19 <- current->signal
  401. cmp4.eq p7,p0=SIG_UNBLOCK,r32
  402. cmp4.eq p8,p0=SIG_SETMASK,r32
  403. ;;
  404. ld8 r18=[r18] // r18 <- current->pending.signal
  405. .pred.rel.mutex p6,p7,p8
  406. (p6) or r14=r3,r14 // SIG_BLOCK
  407. (p7) andcm r14=r3,r14 // SIG_UNBLOCK
  408. (p8) mov r14=r14 // SIG_SETMASK
  409. (p6) mov r8=0 // clear error code
  410. // recalc_sigpending()
  411. add r17=IA64_SIGNAL_GROUP_STOP_COUNT_OFFSET,r19
  412. add r19=IA64_SIGNAL_SHARED_PENDING_OFFSET+IA64_SIGPENDING_SIGNAL_OFFSET,r19
  413. ;;
  414. ld4 r17=[r17] // r17 <- current->signal->group_stop_count
  415. (p7) mov r8=0 // clear error code
  416. ld8 r19=[r19] // r19 <- current->signal->shared_pending
  417. ;;
  418. cmp4.gt p6,p7=r17,r0 // p6/p7 <- (current->signal->group_stop_count > 0)?
  419. (p8) mov r8=0 // clear error code
  420. or r18=r18,r19 // r18 <- current->pending | current->signal->shared_pending
  421. ;;
  422. // r18 <- (current->pending | current->signal->shared_pending) & ~current->blocked:
  423. andcm r18=r18,r14
  424. add r9=TI_FLAGS+IA64_TASK_SIZE,r16
  425. ;;
  426. (p7) cmp.ne.or.andcm p6,p7=r18,r0 // p6/p7 <- signal pending
  427. mov r19=0 // i must not leak kernel bits...
  428. (p6) br.cond.dpnt.many .sig_pending
  429. ;;
  430. 1: ld4 r17=[r9] // r17 <- current->thread_info->flags
  431. ;;
  432. mov ar.ccv=r17
  433. and r18=~_TIF_SIGPENDING,r17 // r18 <- r17 & ~(1 << TIF_SIGPENDING)
  434. ;;
  435. st8 [r2]=r14 // update current->blocked with new mask
  436. cmpxchg4.acq r8=[r9],r18,ar.ccv // current->thread_info->flags <- r18
  437. ;;
  438. cmp.ne p6,p0=r17,r8 // update failed?
  439. (p6) br.cond.spnt.few 1b // yes -> retry
  440. #ifdef CONFIG_SMP
  441. st4.rel [r31]=r0 // release the lock
  442. #endif
  443. ssm psr.i
  444. ;;
  445. srlz.d // ensure psr.i is set again
  446. mov r18=0 // i must not leak kernel bits...
  447. .store_mask:
  448. EX(.fail_efault, (p15) probe.w.fault r34, 3) // verify user has write-access to *oset
  449. EX(.fail_efault, (p15) st8 [r34]=r3)
  450. mov r2=0 // i must not leak kernel bits...
  451. mov r3=0 // i must not leak kernel bits...
  452. mov r8=0 // return 0
  453. mov r9=0 // i must not leak kernel bits...
  454. mov r14=0 // i must not leak kernel bits...
  455. mov r17=0 // i must not leak kernel bits...
  456. mov r31=0 // i must not leak kernel bits...
  457. FSYS_RETURN
  458. .sig_pending:
  459. #ifdef CONFIG_SMP
  460. st4.rel [r31]=r0 // release the lock
  461. #endif
  462. ssm psr.i
  463. ;;
  464. srlz.d
  465. br.sptk.many fsys_fallback_syscall // with signal pending, do the heavy-weight syscall
  466. #ifdef CONFIG_SMP
  467. .lock_contention:
  468. /* Rather than spinning here, fall back on doing a heavy-weight syscall. */
  469. ssm psr.i
  470. ;;
  471. srlz.d
  472. br.sptk.many fsys_fallback_syscall
  473. #endif
  474. END(fsys_rt_sigprocmask)
  475. /*
  476. * fsys_getcpu doesn't use the third parameter in this implementation. It reads
  477. * current_thread_info()->cpu and corresponding node in cpu_to_node_map.
  478. */
  479. ENTRY(fsys_getcpu)
  480. .prologue
  481. .altrp b6
  482. .body
  483. ;;
  484. add r2=TI_FLAGS+IA64_TASK_SIZE,r16
  485. tnat.nz p6,p0 = r32 // guard against NaT argument
  486. add r3=TI_CPU+IA64_TASK_SIZE,r16
  487. ;;
  488. ld4 r3=[r3] // M r3 = thread_info->cpu
  489. ld4 r2=[r2] // M r2 = thread_info->flags
  490. (p6) br.cond.spnt.few .fail_einval // B
  491. ;;
  492. tnat.nz p7,p0 = r33 // I guard against NaT argument
  493. (p7) br.cond.spnt.few .fail_einval // B
  494. #ifdef CONFIG_NUMA
  495. movl r17=cpu_to_node_map
  496. ;;
  497. EX(.fail_efault, probe.w.fault r32, 3) // M This takes 5 cycles
  498. EX(.fail_efault, probe.w.fault r33, 3) // M This takes 5 cycles
  499. shladd r18=r3,1,r17
  500. ;;
  501. ld2 r20=[r18] // r20 = cpu_to_node_map[cpu]
  502. and r2 = TIF_ALLWORK_MASK,r2
  503. ;;
  504. cmp.ne p8,p0=0,r2
  505. (p8) br.spnt.many fsys_fallback_syscall
  506. ;;
  507. ;;
  508. EX(.fail_efault, st4 [r32] = r3)
  509. EX(.fail_efault, st2 [r33] = r20)
  510. mov r8=0
  511. ;;
  512. #else
  513. EX(.fail_efault, probe.w.fault r32, 3) // M This takes 5 cycles
  514. EX(.fail_efault, probe.w.fault r33, 3) // M This takes 5 cycles
  515. and r2 = TIF_ALLWORK_MASK,r2
  516. ;;
  517. cmp.ne p8,p0=0,r2
  518. (p8) br.spnt.many fsys_fallback_syscall
  519. ;;
  520. EX(.fail_efault, st4 [r32] = r3)
  521. EX(.fail_efault, st2 [r33] = r0)
  522. mov r8=0
  523. ;;
  524. #endif
  525. FSYS_RETURN
  526. END(fsys_getcpu)
  527. ENTRY(fsys_fallback_syscall)
  528. .prologue
  529. .altrp b6
  530. .body
  531. /*
  532. * We only get here from light-weight syscall handlers. Thus, we already
  533. * know that r15 contains a valid syscall number. No need to re-check.
  534. */
  535. adds r17=-1024,r15
  536. movl r14=sys_call_table
  537. ;;
  538. rsm psr.i
  539. shladd r18=r17,3,r14
  540. ;;
  541. ld8 r18=[r18] // load normal (heavy-weight) syscall entry-point
  542. mov r29=psr // read psr (12 cyc load latency)
  543. mov r27=ar.rsc
  544. mov r21=ar.fpsr
  545. mov r26=ar.pfs
  546. END(fsys_fallback_syscall)
  547. /* FALL THROUGH */
  548. GLOBAL_ENTRY(fsys_bubble_down)
  549. .prologue
  550. .altrp b6
  551. .body
  552. /*
  553. * We get here for syscalls that don't have a lightweight
  554. * handler. For those, we need to bubble down into the kernel
  555. * and that requires setting up a minimal pt_regs structure,
  556. * and initializing the CPU state more or less as if an
  557. * interruption had occurred. To make syscall-restarts work,
  558. * we setup pt_regs such that cr_iip points to the second
  559. * instruction in syscall_via_break. Decrementing the IP
  560. * hence will restart the syscall via break and not
  561. * decrementing IP will return us to the caller, as usual.
  562. * Note that we preserve the value of psr.pp rather than
  563. * initializing it from dcr.pp. This makes it possible to
  564. * distinguish fsyscall execution from other privileged
  565. * execution.
  566. *
  567. * On entry:
  568. * - normal fsyscall handler register usage, except
  569. * that we also have:
  570. * - r18: address of syscall entry point
  571. * - r21: ar.fpsr
  572. * - r26: ar.pfs
  573. * - r27: ar.rsc
  574. * - r29: psr
  575. *
  576. * We used to clear some PSR bits here but that requires slow
  577. * serialization. Fortuntely, that isn't really necessary.
  578. * The rationale is as follows: we used to clear bits
  579. * ~PSR_PRESERVED_BITS in PSR.L. Since
  580. * PSR_PRESERVED_BITS==PSR.{UP,MFL,MFH,PK,DT,PP,SP,RT,IC}, we
  581. * ended up clearing PSR.{BE,AC,I,DFL,DFH,DI,DB,SI,TB}.
  582. * However,
  583. *
  584. * PSR.BE : already is turned off in __kernel_syscall_via_epc()
  585. * PSR.AC : don't care (kernel normally turns PSR.AC on)
  586. * PSR.I : already turned off by the time fsys_bubble_down gets
  587. * invoked
  588. * PSR.DFL: always 0 (kernel never turns it on)
  589. * PSR.DFH: don't care --- kernel never touches f32-f127 on its own
  590. * initiative
  591. * PSR.DI : always 0 (kernel never turns it on)
  592. * PSR.SI : always 0 (kernel never turns it on)
  593. * PSR.DB : don't care --- kernel never enables kernel-level
  594. * breakpoints
  595. * PSR.TB : must be 0 already; if it wasn't zero on entry to
  596. * __kernel_syscall_via_epc, the branch to fsys_bubble_down
  597. * will trigger a taken branch; the taken-trap-handler then
  598. * converts the syscall into a break-based system-call.
  599. */
  600. /*
  601. * Reading psr.l gives us only bits 0-31, psr.it, and psr.mc.
  602. * The rest we have to synthesize.
  603. */
  604. # define PSR_ONE_BITS ((3 << IA64_PSR_CPL0_BIT) \
  605. | (0x1 << IA64_PSR_RI_BIT) \
  606. | IA64_PSR_BN | IA64_PSR_I)
  607. invala // M0|1
  608. movl r14=ia64_ret_from_syscall // X
  609. nop.m 0
  610. movl r28=__kernel_syscall_via_break // X create cr.iip
  611. ;;
  612. mov r2=r16 // A get task addr to addl-addressable register
  613. adds r16=IA64_TASK_THREAD_ON_USTACK_OFFSET,r16 // A
  614. mov r31=pr // I0 save pr (2 cyc)
  615. ;;
  616. st1 [r16]=r0 // M2|3 clear current->thread.on_ustack flag
  617. addl r22=IA64_RBS_OFFSET,r2 // A compute base of RBS
  618. add r3=TI_FLAGS+IA64_TASK_SIZE,r2 // A
  619. ;;
  620. ld4 r3=[r3] // M0|1 r3 = current_thread_info()->flags
  621. lfetch.fault.excl.nt1 [r22] // M0|1 prefetch register backing-store
  622. nop.i 0
  623. ;;
  624. mov ar.rsc=0 // M2 set enforced lazy mode, pl 0, LE, loadrs=0
  625. nop.m 0
  626. nop.i 0
  627. ;;
  628. mov r23=ar.bspstore // M2 (12 cyc) save ar.bspstore
  629. mov.m r24=ar.rnat // M2 (5 cyc) read ar.rnat (dual-issues!)
  630. nop.i 0
  631. ;;
  632. mov ar.bspstore=r22 // M2 (6 cyc) switch to kernel RBS
  633. movl r8=PSR_ONE_BITS // X
  634. ;;
  635. mov r25=ar.unat // M2 (5 cyc) save ar.unat
  636. mov r19=b6 // I0 save b6 (2 cyc)
  637. mov r20=r1 // A save caller's gp in r20
  638. ;;
  639. or r29=r8,r29 // A construct cr.ipsr value to save
  640. mov b6=r18 // I0 copy syscall entry-point to b6 (7 cyc)
  641. addl r1=IA64_STK_OFFSET-IA64_PT_REGS_SIZE,r2 // A compute base of memory stack
  642. mov r18=ar.bsp // M2 save (kernel) ar.bsp (12 cyc)
  643. cmp.ne pKStk,pUStk=r0,r0 // A set pKStk <- 0, pUStk <- 1
  644. br.call.sptk.many b7=ia64_syscall_setup // B
  645. ;;
  646. mov ar.rsc=0x3 // M2 set eager mode, pl 0, LE, loadrs=0
  647. mov rp=r14 // I0 set the real return addr
  648. and r3=_TIF_SYSCALL_TRACEAUDIT,r3 // A
  649. ;;
  650. ssm psr.i // M2 we're on kernel stacks now, reenable irqs
  651. cmp.eq p8,p0=r3,r0 // A
  652. (p10) br.cond.spnt.many ia64_ret_from_syscall // B return if bad call-frame or r15 is a NaT
  653. nop.m 0
  654. (p8) br.call.sptk.many b6=b6 // B (ignore return address)
  655. br.cond.spnt ia64_trace_syscall // B
  656. END(fsys_bubble_down)
  657. .rodata
  658. .align 8
  659. .globl fsyscall_table
  660. data8 fsys_bubble_down
  661. fsyscall_table:
  662. data8 fsys_ni_syscall
  663. data8 0 // exit // 1025
  664. data8 0 // read
  665. data8 0 // write
  666. data8 0 // open
  667. data8 0 // close
  668. data8 0 // creat // 1030
  669. data8 0 // link
  670. data8 0 // unlink
  671. data8 0 // execve
  672. data8 0 // chdir
  673. data8 0 // fchdir // 1035
  674. data8 0 // utimes
  675. data8 0 // mknod
  676. data8 0 // chmod
  677. data8 0 // chown
  678. data8 0 // lseek // 1040
  679. data8 fsys_getpid // getpid
  680. data8 fsys_getppid // getppid
  681. data8 0 // mount
  682. data8 0 // umount
  683. data8 0 // setuid // 1045
  684. data8 0 // getuid
  685. data8 0 // geteuid
  686. data8 0 // ptrace
  687. data8 0 // access
  688. data8 0 // sync // 1050
  689. data8 0 // fsync
  690. data8 0 // fdatasync
  691. data8 0 // kill
  692. data8 0 // rename
  693. data8 0 // mkdir // 1055
  694. data8 0 // rmdir
  695. data8 0 // dup
  696. data8 0 // pipe
  697. data8 0 // times
  698. data8 0 // brk // 1060
  699. data8 0 // setgid
  700. data8 0 // getgid
  701. data8 0 // getegid
  702. data8 0 // acct
  703. data8 0 // ioctl // 1065
  704. data8 0 // fcntl
  705. data8 0 // umask
  706. data8 0 // chroot
  707. data8 0 // ustat
  708. data8 0 // dup2 // 1070
  709. data8 0 // setreuid
  710. data8 0 // setregid
  711. data8 0 // getresuid
  712. data8 0 // setresuid
  713. data8 0 // getresgid // 1075
  714. data8 0 // setresgid
  715. data8 0 // getgroups
  716. data8 0 // setgroups
  717. data8 0 // getpgid
  718. data8 0 // setpgid // 1080
  719. data8 0 // setsid
  720. data8 0 // getsid
  721. data8 0 // sethostname
  722. data8 0 // setrlimit
  723. data8 0 // getrlimit // 1085
  724. data8 0 // getrusage
  725. data8 fsys_gettimeofday // gettimeofday
  726. data8 0 // settimeofday
  727. data8 0 // select
  728. data8 0 // poll // 1090
  729. data8 0 // symlink
  730. data8 0 // readlink
  731. data8 0 // uselib
  732. data8 0 // swapon
  733. data8 0 // swapoff // 1095
  734. data8 0 // reboot
  735. data8 0 // truncate
  736. data8 0 // ftruncate
  737. data8 0 // fchmod
  738. data8 0 // fchown // 1100
  739. data8 0 // getpriority
  740. data8 0 // setpriority
  741. data8 0 // statfs
  742. data8 0 // fstatfs
  743. data8 0 // gettid // 1105
  744. data8 0 // semget
  745. data8 0 // semop
  746. data8 0 // semctl
  747. data8 0 // msgget
  748. data8 0 // msgsnd // 1110
  749. data8 0 // msgrcv
  750. data8 0 // msgctl
  751. data8 0 // shmget
  752. data8 0 // shmat
  753. data8 0 // shmdt // 1115
  754. data8 0 // shmctl
  755. data8 0 // syslog
  756. data8 0 // setitimer
  757. data8 0 // getitimer
  758. data8 0 // 1120
  759. data8 0
  760. data8 0
  761. data8 0 // vhangup
  762. data8 0 // lchown
  763. data8 0 // remap_file_pages // 1125
  764. data8 0 // wait4
  765. data8 0 // sysinfo
  766. data8 0 // clone
  767. data8 0 // setdomainname
  768. data8 0 // newuname // 1130
  769. data8 0 // adjtimex
  770. data8 0
  771. data8 0 // init_module
  772. data8 0 // delete_module
  773. data8 0 // 1135
  774. data8 0
  775. data8 0 // quotactl
  776. data8 0 // bdflush
  777. data8 0 // sysfs
  778. data8 0 // personality // 1140
  779. data8 0 // afs_syscall
  780. data8 0 // setfsuid
  781. data8 0 // setfsgid
  782. data8 0 // getdents
  783. data8 0 // flock // 1145
  784. data8 0 // readv
  785. data8 0 // writev
  786. data8 0 // pread64
  787. data8 0 // pwrite64
  788. data8 0 // sysctl // 1150
  789. data8 0 // mmap
  790. data8 0 // munmap
  791. data8 0 // mlock
  792. data8 0 // mlockall
  793. data8 0 // mprotect // 1155
  794. data8 0 // mremap
  795. data8 0 // msync
  796. data8 0 // munlock
  797. data8 0 // munlockall
  798. data8 0 // sched_getparam // 1160
  799. data8 0 // sched_setparam
  800. data8 0 // sched_getscheduler
  801. data8 0 // sched_setscheduler
  802. data8 0 // sched_yield
  803. data8 0 // sched_get_priority_max // 1165
  804. data8 0 // sched_get_priority_min
  805. data8 0 // sched_rr_get_interval
  806. data8 0 // nanosleep
  807. data8 0 // nfsservctl
  808. data8 0 // prctl // 1170
  809. data8 0 // getpagesize
  810. data8 0 // mmap2
  811. data8 0 // pciconfig_read
  812. data8 0 // pciconfig_write
  813. data8 0 // perfmonctl // 1175
  814. data8 0 // sigaltstack
  815. data8 0 // rt_sigaction
  816. data8 0 // rt_sigpending
  817. data8 fsys_rt_sigprocmask // rt_sigprocmask
  818. data8 0 // rt_sigqueueinfo // 1180
  819. data8 0 // rt_sigreturn
  820. data8 0 // rt_sigsuspend
  821. data8 0 // rt_sigtimedwait
  822. data8 0 // getcwd
  823. data8 0 // capget // 1185
  824. data8 0 // capset
  825. data8 0 // sendfile
  826. data8 0
  827. data8 0
  828. data8 0 // socket // 1190
  829. data8 0 // bind
  830. data8 0 // connect
  831. data8 0 // listen
  832. data8 0 // accept
  833. data8 0 // getsockname // 1195
  834. data8 0 // getpeername
  835. data8 0 // socketpair
  836. data8 0 // send
  837. data8 0 // sendto
  838. data8 0 // recv // 1200
  839. data8 0 // recvfrom
  840. data8 0 // shutdown
  841. data8 0 // setsockopt
  842. data8 0 // getsockopt
  843. data8 0 // sendmsg // 1205
  844. data8 0 // recvmsg
  845. data8 0 // pivot_root
  846. data8 0 // mincore
  847. data8 0 // madvise
  848. data8 0 // newstat // 1210
  849. data8 0 // newlstat
  850. data8 0 // newfstat
  851. data8 0 // clone2
  852. data8 0 // getdents64
  853. data8 0 // getunwind // 1215
  854. data8 0 // readahead
  855. data8 0 // setxattr
  856. data8 0 // lsetxattr
  857. data8 0 // fsetxattr
  858. data8 0 // getxattr // 1220
  859. data8 0 // lgetxattr
  860. data8 0 // fgetxattr
  861. data8 0 // listxattr
  862. data8 0 // llistxattr
  863. data8 0 // flistxattr // 1225
  864. data8 0 // removexattr
  865. data8 0 // lremovexattr
  866. data8 0 // fremovexattr
  867. data8 0 // tkill
  868. data8 0 // futex // 1230
  869. data8 0 // sched_setaffinity
  870. data8 0 // sched_getaffinity
  871. data8 fsys_set_tid_address // set_tid_address
  872. data8 0 // fadvise64_64
  873. data8 0 // tgkill // 1235
  874. data8 0 // exit_group
  875. data8 0 // lookup_dcookie
  876. data8 0 // io_setup
  877. data8 0 // io_destroy
  878. data8 0 // io_getevents // 1240
  879. data8 0 // io_submit
  880. data8 0 // io_cancel
  881. data8 0 // epoll_create
  882. data8 0 // epoll_ctl
  883. data8 0 // epoll_wait // 1245
  884. data8 0 // restart_syscall
  885. data8 0 // semtimedop
  886. data8 0 // timer_create
  887. data8 0 // timer_settime
  888. data8 0 // timer_gettime // 1250
  889. data8 0 // timer_getoverrun
  890. data8 0 // timer_delete
  891. data8 0 // clock_settime
  892. data8 fsys_clock_gettime // clock_gettime
  893. data8 0 // clock_getres // 1255
  894. data8 0 // clock_nanosleep
  895. data8 0 // fstatfs64
  896. data8 0 // statfs64
  897. data8 0 // mbind
  898. data8 0 // get_mempolicy // 1260
  899. data8 0 // set_mempolicy
  900. data8 0 // mq_open
  901. data8 0 // mq_unlink
  902. data8 0 // mq_timedsend
  903. data8 0 // mq_timedreceive // 1265
  904. data8 0 // mq_notify
  905. data8 0 // mq_getsetattr
  906. data8 0 // kexec_load
  907. data8 0 // vserver
  908. data8 0 // waitid // 1270
  909. data8 0 // add_key
  910. data8 0 // request_key
  911. data8 0 // keyctl
  912. data8 0 // ioprio_set
  913. data8 0 // ioprio_get // 1275
  914. data8 0 // move_pages
  915. data8 0 // inotify_init
  916. data8 0 // inotify_add_watch
  917. data8 0 // inotify_rm_watch
  918. data8 0 // migrate_pages // 1280
  919. data8 0 // openat
  920. data8 0 // mkdirat
  921. data8 0 // mknodat
  922. data8 0 // fchownat
  923. data8 0 // futimesat // 1285
  924. data8 0 // newfstatat
  925. data8 0 // unlinkat
  926. data8 0 // renameat
  927. data8 0 // linkat
  928. data8 0 // symlinkat // 1290
  929. data8 0 // readlinkat
  930. data8 0 // fchmodat
  931. data8 0 // faccessat
  932. data8 0
  933. data8 0 // 1295
  934. data8 0 // unshare
  935. data8 0 // splice
  936. data8 0 // set_robust_list
  937. data8 0 // get_robust_list
  938. data8 0 // sync_file_range // 1300
  939. data8 0 // tee
  940. data8 0 // vmsplice
  941. data8 0
  942. data8 fsys_getcpu // getcpu // 1304
  943. // fill in zeros for the remaining entries
  944. .zero:
  945. .space fsyscall_table + 8*NR_syscalls - .zero, 0