fsys.S 30 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037
  1. /*
  2. * This file contains the light-weight system call handlers (fsyscall-handlers).
  3. *
  4. * Copyright (C) 2003 Hewlett-Packard Co
  5. * David Mosberger-Tang <davidm@hpl.hp.com>
  6. *
  7. * 25-Sep-03 davidm Implement fsys_rt_sigprocmask().
  8. * 18-Feb-03 louisk Implement fsys_gettimeofday().
  9. * 28-Feb-03 davidm Fixed several bugs in fsys_gettimeofday(). Tuned it some more,
  10. * probably broke it along the way... ;-)
  11. * 13-Jul-04 clameter Implement fsys_clock_gettime and revise fsys_gettimeofday to make
  12. * it capable of using memory based clocks without falling back to C code.
  13. * 08-Feb-07 Fenghua Yu Implement fsys_getcpu.
  14. *
  15. */
  16. #include <asm/asmmacro.h>
  17. #include <asm/errno.h>
  18. #include <asm/asm-offsets.h>
  19. #include <asm/percpu.h>
  20. #include <asm/thread_info.h>
  21. #include <asm/sal.h>
  22. #include <asm/signal.h>
  23. #include <asm/system.h>
  24. #include <asm/unistd.h>
  25. #include "entry.h"
  26. #include "paravirt_inst.h"
  27. /*
  28. * See Documentation/ia64/fsys.txt for details on fsyscalls.
  29. *
  30. * On entry to an fsyscall handler:
  31. * r10 = 0 (i.e., defaults to "successful syscall return")
  32. * r11 = saved ar.pfs (a user-level value)
  33. * r15 = system call number
  34. * r16 = "current" task pointer (in normal kernel-mode, this is in r13)
  35. * r32-r39 = system call arguments
  36. * b6 = return address (a user-level value)
  37. * ar.pfs = previous frame-state (a user-level value)
  38. * PSR.be = cleared to zero (i.e., little-endian byte order is in effect)
  39. * all other registers may contain values passed in from user-mode
  40. *
  41. * On return from an fsyscall handler:
  42. * r11 = saved ar.pfs (as passed into the fsyscall handler)
  43. * r15 = system call number (as passed into the fsyscall handler)
  44. * r32-r39 = system call arguments (as passed into the fsyscall handler)
  45. * b6 = return address (as passed into the fsyscall handler)
  46. * ar.pfs = previous frame-state (as passed into the fsyscall handler)
  47. */
  /*
   * fsys_ni_syscall: handler that always fails. It returns with r8 = ENOSYS
   * and r10 = -1 (handlers are entered with r10 = 0, which means success).
   */
  48. ENTRY(fsys_ni_syscall)
  49. .prologue
  50. .altrp b6 // unwind info: the return address is held in b6
  51. .body
  52. mov r8=ENOSYS // r8 = error code handed back to the caller
  53. mov r10=-1 // r10 = -1 marks the call as failed
  54. FSYS_RETURN
  55. END(fsys_ni_syscall)
  /*
   * fsys_getpid: light-weight getpid. Returns in r8 the number stored at
   * pid->numbers[pid->level].nr for the PIDTYPE_PID pid of
   * current->group_leader. If any TIF_ALLWORK_MASK bit is set in the
   * thread-info flags, it branches to fsys_fallback_syscall instead.
   */
  56. ENTRY(fsys_getpid)
  57. .prologue
  58. .altrp b6
  59. .body
  60. add r17=IA64_TASK_GROUP_LEADER_OFFSET,r16 // r17 = &current->group_leader
  61. ;;
  62. ld8 r17=[r17] // r17 = current->group_leader
  63. add r9=TI_FLAGS+IA64_TASK_SIZE,r16 // r9 = address of the thread-info flags word
  64. ;;
  65. ld4 r9=[r9] // r9 = thread-info flags
  66. add r17=IA64_TASK_TGIDLINK_OFFSET,r17 // r17 = address of the group leader's pid pointer
  67. ;;
  68. and r9=TIF_ALLWORK_MASK,r9 // keep only the pending-work bits
  69. ld8 r17=[r17] // r17 = current->group_leader->pids[PIDTYPE_PID].pid
  70. ;;
  71. add r8=IA64_PID_LEVEL_OFFSET,r17 // r8 = &pid->level
  72. ;;
  73. ld4 r8=[r8] // r8 = pid->level
  74. add r17=IA64_PID_UPID_OFFSET,r17 // r17 = &pid->numbers[0]
  75. ;;
  76. shl r8=r8,IA64_UPID_SHIFT // scale the level into a byte offset inside numbers[]
  77. ;;
  78. add r17=r17,r8 // r17 = &pid->numbers[pid->level]
  79. ;;
  80. ld4 r8=[r17] // r8 = pid->numbers[pid->level].nr
  81. ;;
  82. mov r17=0 // do not hand a kernel pointer back to user level
  83. ;;
  84. cmp.ne p8,p0=0,r9 // p8 = at least one work flag is pending
  85. (p8) br.spnt.many fsys_fallback_syscall // pending work -> heavy-weight syscall path
  86. FSYS_RETURN
  87. END(fsys_getpid)
  /*
   * fsys_getppid: light-weight getppid. Returns in r8 the tgid of
   * current->group_leader->real_parent.
   *
   * With CONFIG_SMP, real_parent is read again after the tgid load and the
   * whole sequence is retried (label 1) if the pointer changed in between.
   *
   * NOTE(review): the branch to fsys_fallback_syscall on pending work (p8)
   * sits inside the CONFIG_SMP section only; in the non-SMP build p8 is
   * computed but not used by this handler. Confirm that this is intended.
   */
  88. ENTRY(fsys_getppid)
  89. .prologue
  90. .altrp b6
  91. .body
  92. add r17=IA64_TASK_GROUP_LEADER_OFFSET,r16 // r17 = &current->group_leader
  93. ;;
  94. ld8 r17=[r17] // r17 = current->group_leader
  95. add r9=TI_FLAGS+IA64_TASK_SIZE,r16 // r9 = address of the thread-info flags word
  96. ;;
  97. ld4 r9=[r9] // r9 = thread-info flags
  98. add r17=IA64_TASK_REAL_PARENT_OFFSET,r17 // r17 = &current->group_leader->real_parent
  99. ;;
  100. and r9=TIF_ALLWORK_MASK,r9 // keep only the pending-work bits
  101. 1: ld8 r18=[r17] // r18 = current->group_leader->real_parent
  102. ;;
  103. cmp.ne p8,p0=0,r9 // p8 = at least one work flag is pending
  104. add r8=IA64_TASK_TGID_OFFSET,r18 // r8 = &current->group_leader->real_parent->tgid
  105. ;;
  106. /*
  107. * The .acq is needed to ensure that the read of tgid has returned its data before
  108. * we re-check "real_parent".
  109. */
  110. ld4.acq r8=[r8] // r8 = current->group_leader->real_parent->tgid
  111. #ifdef CONFIG_SMP
  112. /*
  113. * Re-read current->group_leader->real_parent.
  114. */
  115. ld8 r19=[r17] // r19 = current->group_leader->real_parent
  116. (p8) br.spnt.many fsys_fallback_syscall
  117. ;;
  118. cmp.ne p6,p0=r18,r19 // did real_parent change?
  119. mov r19=0 // i must not leak kernel bits...
  120. (p6) br.cond.spnt.few 1b // yes -> redo the read of tgid and the check
  121. ;;
  122. mov r17=0 // i must not leak kernel bits...
  123. mov r18=0 // i must not leak kernel bits...
  124. #else
  125. mov r17=0 // i must not leak kernel bits...
  126. mov r18=0 // i must not leak kernel bits...
  127. mov r19=0 // i must not leak kernel bits...
  128. #endif
  129. FSYS_RETURN
  130. END(fsys_getppid)
  /*
   * fsys_set_tid_address: light-weight set_tid_address.
   *
   * In:  r32 = value to record in the task field at
   *            IA64_TASK_CLEAR_CHILD_TID_OFFSET.
   * Out: r8  = pid->numbers[pid->level].nr for current's PIDTYPE_PID pid.
   *
   * If r32 is NaT, -1 is stored in place of the argument. The store is
   * predicated on p6/p7 only, so it is issued even when pending work (p8)
   * sends the call to fsys_fallback_syscall.
   */
  131. ENTRY(fsys_set_tid_address)
  132. .prologue
  133. .altrp b6
  134. .body
  135. add r9=TI_FLAGS+IA64_TASK_SIZE,r16 // r9 = address of the thread-info flags word
  136. add r17=IA64_TASK_TGIDLINK_OFFSET,r16 // r17 = address of current's pid pointer
  137. ;;
  138. ld4 r9=[r9] // r9 = thread-info flags
  139. tnat.z p6,p7=r32 // check argument register for being NaT
  140. ld8 r17=[r17] // r17 = current->pids[PIDTYPE_PID].pid
  141. ;;
  142. and r9=TIF_ALLWORK_MASK,r9 // keep only the pending-work bits
  143. add r8=IA64_PID_LEVEL_OFFSET,r17 // r8 = &pid->level
  144. add r18=IA64_TASK_CLEAR_CHILD_TID_OFFSET,r16 // r18 = address of the field to update
  145. ;;
  146. ld4 r8=[r8] // r8 = pid->level
  147. add r17=IA64_PID_UPID_OFFSET,r17 // r17 = &pid->numbers[0]
  148. ;;
  149. shl r8=r8,IA64_UPID_SHIFT // scale the level into a byte offset inside numbers[]
  150. ;;
  151. add r17=r17,r8 // r17 = &pid->numbers[pid->level]
  152. ;;
  153. ld4 r8=[r17] // r8 = pid->numbers[pid->level].nr
  154. ;;
  155. cmp.ne p8,p0=0,r9 // p8 = at least one work flag is pending
  156. mov r17=-1 // value stored when the argument is NaT
  157. ;;
  158. (p6) st8 [r18]=r32 // argument is valid: record it
  159. (p7) st8 [r18]=r17 // argument is NaT: record -1 instead
  160. (p8) br.spnt.many fsys_fallback_syscall
  161. ;;
  162. mov r17=0 // i must not leak kernel bits...
  163. mov r18=0 // i must not leak kernel bits...
  164. FSYS_RETURN
  165. END(fsys_set_tid_address)
  /*
   * Layout guards: the time handler below loads the gtod lock sequence
   * straight from the base address of fsyscall_gtod_data and the jitter flag
   * straight from the base address of itc_jitter_data, so both members have
   * to sit at offset 0.
   */
  166. #if IA64_GTOD_LOCK_OFFSET !=0
  167. #error fsys_gettimeofday incompatible with changes to struct fsyscall_gtod_data_t
  168. #endif
  169. #if IA64_ITC_JITTER_OFFSET !=0
  170. #error fsys_gettimeofday incompatible with changes to struct itc_jitter_data_t
  171. #endif
  /*
   * CLOCK_REALTIME and CLOCK_MONOTONIC are the clock ids accepted by
   * fsys_clock_gettime. The two flag values are bits 14 and 15; the shared
   * .gettime code copies them into predicates p14 and p15 with
   * "mov pr = r30,0xc000".
   */
  172. #define CLOCK_REALTIME 0
  173. #define CLOCK_MONOTONIC 1
  174. #define CLOCK_DIVIDE_BY_1000 0x4000
  175. #define CLOCK_ADD_MONOTONIC 0x8000
  /*
   * fsys_gettimeofday: light-weight gettimeofday.
   *
   * In:  r32 = user pointer that receives the result (copied to r31).
   *      r33 = second argument; it is only checked for NaT here.
   * Out: on success r8 = 0, r10 = 0, the seconds are stored at [r31] and the
   *      sub-second part at [r31 + IA64_TIMESPEC_TV_NSEC_OFFSET]. Because this
   *      entry sets CLOCK_DIVIDE_BY_1000, the sub-second part is the
   *      nanosecond count divided by 1000.
   *      .fail_einval returns r8 = EINVAL, r10 = -1 (NaT argument).
   *      .fail_efault returns r8 = EFAULT, r10 = -1 (user memory access failed).
   *
   * Branches to fsys_fallback_syscall when a TIF_ALLWORK_MASK flag is set.
   *
   * The code from .gettime onwards is shared: fsys_clock_gettime jumps to
   * .gettime with r30/r31 already set up, and the .fail_einval/.fail_efault
   * exits are also used by later handlers in this file.
   *
   * The time data is read inside a sequence-counter loop: the sequence is
   * sampled at .time_redo (forced even, so an odd value can never match) and
   * compared with a second read at the end; any difference restarts the loop.
   */
  176. ENTRY(fsys_gettimeofday)
  177. .prologue
  178. .altrp b6
  179. .body
  180. mov r31 = r32 // r31 = result pointer (first argument)
  181. tnat.nz p6,p0 = r33 // guard against NaT argument
  182. (p6) br.cond.spnt.few .fail_einval
  183. mov r30 = CLOCK_DIVIDE_BY_1000 // flags: wall time, sub-second part divided by 1000
  184. ;;
  185. .gettime:
  186. // Register map
  187. // Incoming r31 = pointer to address where to place result
  188. // r30 = flags determining how time is processed
  189. // r2,r3 = temp r4-r7 preserved
  190. // r8 = result nanoseconds
  191. // r9 = result seconds
  192. // r10 = temporary storage for clock difference
  193. // r11 = preserved: saved ar.pfs
  194. // r12 = preserved: memory stack
  195. // r13 = preserved: thread pointer
  196. // r14 = address of mask / mask value
  197. // r15 = preserved: system call number
  198. // r16 = preserved: current task pointer
  199. // r17 = (not used)
  200. // r18 = (not used)
  201. // r19 = address of itc_lastcycle
  202. // r20 = struct fsyscall_gtod_data (= address of gtod_lock.sequence)
  203. // r21 = address of mmio_ptr
  204. // r22 = address of wall_time or monotonic_time
  205. // r23 = address of shift / value
  206. // r24 = address mult factor / cycle_last value
  207. // r25 = itc_lastcycle value
  208. // r26 = address clocksource cycle_last
  209. // r27 = (not used)
  210. // r28 = sequence number at the beginning of critical section
  211. // r29 = address of itc_jitter
  212. // r30 = time processing flags / memory address
  213. // r31 = pointer to result
  214. // Predicates
  215. // p6,p7 short term use
  216. // p8 = timesource ar.itc
  217. // p9 = timesource mmio64
  218. // p10 = timesource mmio32 - not used
  219. // p11 = timesource not to be handled by asm code
  220. // p12 = memory time source ( = p9 | p10) - not used
  221. // p13 = do cmpxchg with itc_lastcycle
  222. // p14 = Divide by 1000
  223. // p15 = Add monotonic
  224. //
  225. // Note that instructions are optimized for McKinley. McKinley can
  226. // process two bundles simultaneously and therefore we continuously
  227. // try to feed the CPU two bundles and then a stop.
  228. add r2 = TI_FLAGS+IA64_TASK_SIZE,r16 // r2 = address of the thread-info flags word
  229. tnat.nz p6,p0 = r31 // guard against Nat argument
  230. (p6) br.cond.spnt.few .fail_einval
  231. movl r20 = fsyscall_gtod_data // load fsyscall gettimeofday data address
  232. ;;
  233. ld4 r2 = [r2] // process work pending flags
  234. movl r29 = itc_jitter_data // itc_jitter
  235. add r22 = IA64_GTOD_WALL_TIME_OFFSET,r20 // wall_time
  236. add r21 = IA64_CLKSRC_MMIO_OFFSET,r20 // r21 = address of mmio_ptr
  237. mov pr = r30,0xc000 // Set predicates according to function
  238. ;;
  239. and r2 = TIF_ALLWORK_MASK,r2 // keep only the pending-work bits
  240. add r19 = IA64_ITC_LASTCYCLE_OFFSET,r29 // r19 = address of itc_lastcycle
  241. (p15) add r22 = IA64_GTOD_MONO_TIME_OFFSET,r20 // monotonic_time
  242. ;;
  243. add r26 = IA64_CLKSRC_CYCLE_LAST_OFFSET,r20 // clksrc_cycle_last
  244. cmp.ne p6, p0 = 0, r2 // Fallback if work is scheduled
  245. (p6) br.cond.spnt.many fsys_fallback_syscall
  246. ;;
  247. // Begin critical section
  248. .time_redo:
  249. ld4.acq r28 = [r20] // gtod_lock.sequence, Must take first
  250. ;;
  251. and r28 = ~1,r28 // And make sequence even to force retry if odd
  252. ;;
  253. ld8 r30 = [r21] // clocksource->mmio_ptr
  254. add r24 = IA64_CLKSRC_MULT_OFFSET,r20 // r24 = address of the mult factor
  255. ld4 r2 = [r29] // itc_jitter value
  256. add r23 = IA64_CLKSRC_SHIFT_OFFSET,r20 // r23 = address of the shift value
  257. add r14 = IA64_CLKSRC_MASK_OFFSET,r20 // r14 = address of the mask
  258. ;;
  259. ld4 r3 = [r24] // clocksource mult value
  260. ld8 r14 = [r14] // clocksource mask value
  261. cmp.eq p8,p9 = 0,r30 // use cpu timer if no mmio_ptr
  262. ;;
  263. setf.sig f7 = r3 // Setup for mult scaling of counter
  264. (p8) cmp.ne p13,p0 = r2,r0 // need itc_jitter compensation, set p13
  265. ld4 r23 = [r23] // clocksource shift value
  266. ld8 r24 = [r26] // get clksrc_cycle_last value
  267. (p9) cmp.eq p13,p0 = 0,r30 // if mmio_ptr, clear p13 jitter control
  268. ;;
  269. .pred.rel.mutex p8,p9
  270. MOV_FROM_ITC(p8, p6, r2, r10) // CPU_TIMER. 36 clocks latency!!!
  271. (p9) ld8 r2 = [r30] // MMIO_TIMER. Could also have latency issues..
  272. (p13) ld8 r25 = [r19] // get itc_lastcycle value
  273. ld8 r9 = [r22],IA64_TIMESPEC_TV_NSEC_OFFSET // tv_sec
  274. ;;
  275. ld8 r8 = [r22],-IA64_TIMESPEC_TV_NSEC_OFFSET // tv_nsec
  276. (p13) sub r3 = r25,r2 // Diff needed before comparison (thanks davidm)
  277. ;;
  278. (p13) cmp.gt.unc p6,p7 = r3,r0 // check if it is less than last. p6,p7 cleared
  279. sub r10 = r2,r24 // current_cycle - last_cycle
  280. ;;
  281. (p6) sub r10 = r25,r24 // time we got was less than last_cycle
  282. (p7) mov ar.ccv = r25 // more than last_cycle. Prep for cmpxchg
  283. ;;
  284. (p7) cmpxchg8.rel r3 = [r19],r2,ar.ccv // publish our counter value as the new itc_lastcycle
  285. ;;
  286. (p7) cmp.ne p7,p0 = r25,r3 // if cmpxchg not successful
  287. ;;
  288. (p7) sub r10 = r3,r24 // then use new last_cycle instead
  289. ;;
  290. and r10 = r10,r14 // Apply mask
  291. ;;
  292. setf.sig f8 = r10 // move the cycle delta to f8 for the multiply
  293. nop.i 123
  294. ;;
  295. // fault check takes 5 cycles and we have spare time
  296. EX(.fail_efault, probe.w.fault r31, 3)
  297. xmpy.l f8 = f8,f7 // nsec_per_cyc*(counter-last_counter)
  298. ;;
  299. getf.sig r2 = f8 // r2 = scaled cycle delta (before the shift)
  300. mf
  301. ;;
  302. ld4 r10 = [r20] // gtod_lock.sequence
  303. shr.u r2 = r2,r23 // shift by factor
  304. ;;
  305. add r8 = r8,r2 // Add xtime.nsecs
  306. cmp4.ne p7,p0 = r28,r10 // p7 = sequence differs from the even value sampled at .time_redo
  307. (p7) br.cond.dpnt.few .time_redo // sequence number changed, redo
  308. // End critical section.
  309. // Now r8=tv->tv_nsec and r9=tv->tv_sec
  310. mov r10 = r0 // r10 = 0: successful return
  311. movl r2 = 1000000000 // nanoseconds per second
  312. add r23 = IA64_TIMESPEC_TV_NSEC_OFFSET, r31 // r23 = address of the sub-second result field
  313. (p14) movl r3 = 2361183241434822607 // Prep for / 1000 hack: this is ceil(2^68 / 125)
  314. ;;
  315. .time_normalize:
  316. mov r21 = r8 // r21 = nanoseconds; stored unchanged unless p14 is set
  317. cmp.ge p6,p0 = r8,r2 // p6 = nanosecond count holds at least one full second
  318. (p14) shr.u r20 = r8, 3 // We can repeat this if necessary just wasting time
  319. ;;
  320. (p14) setf.sig f8 = r20
  321. (p6) sub r8 = r8,r2 // carry one second out of the nanosecond count...
  322. (p6) add r9 = 1,r9 // two nops before the branch.
  323. (p14) setf.sig f7 = r3 // Chances for repeats are 1 in 10000 for gettod
  324. (p6) br.cond.dpnt.few .time_normalize
  325. ;;
  326. // Divided by 8 through shift. Now divide by 125
  327. // The compiler was able to do that with a multiply
  328. // and a shift and we do the same
  329. EX(.fail_efault, probe.w.fault r23, 3) // This also costs 5 cycles
  330. (p14) xmpy.hu f8 = f8, f7 // xmpy has 5 cycles latency so use it
  331. ;;
  332. (p14) getf.sig r2 = f8 // r2 = high 64 bits of (nsec / 8) * magic
  333. ;;
  334. mov r8 = r0 // return value 0
  335. (p14) shr.u r21 = r2, 4 // finish the divide by 125: r21 = nsec / 1000
  336. ;;
  337. EX(.fail_efault, st8 [r31] = r9) // store the seconds
  338. EX(.fail_efault, st8 [r23] = r21) // store the sub-second part
  339. FSYS_RETURN
  340. .fail_einval:
  341. mov r8 = EINVAL
  342. mov r10 = -1 // r10 = -1 marks the call as failed
  343. FSYS_RETURN
  344. .fail_efault:
  345. mov r8 = EFAULT
  346. mov r10 = -1 // r10 = -1 marks the call as failed
  347. FSYS_RETURN
  348. END(fsys_gettimeofday)
  /*
   * fsys_clock_gettime: light-weight clock_gettime for CLOCK_REALTIME and
   * CLOCK_MONOTONIC only.
   *
   * In:  r32 = clock id, r33 = user pointer that receives the result.
   *
   * Any clock id above CLOCK_MONOTONIC (unsigned 32-bit compare) goes to
   * fsys_fallback_syscall. Otherwise r31 is set to the result pointer and
   * r30 to (clock id << 15), which is 0 for CLOCK_REALTIME and
   * CLOCK_ADD_MONOTONIC (0x8000) for CLOCK_MONOTONIC, and control jumps to
   * the .gettime code inside fsys_gettimeofday. CLOCK_DIVIDE_BY_1000 is not
   * set on this path, so the nanosecond count is stored unscaled.
   *
   * NOTE(review): r32 is not tnat-checked in this block, unlike the pointer
   * arguments checked at .gettime. Confirm that this is intended.
   */
  349. ENTRY(fsys_clock_gettime)
  350. .prologue
  351. .altrp b6
  352. .body
  353. cmp4.ltu p6, p0 = CLOCK_MONOTONIC, r32 // p6 = clock id > CLOCK_MONOTONIC (unsigned)
  354. // Fallback if this is not CLOCK_REALTIME or CLOCK_MONOTONIC
  355. (p6) br.spnt.few fsys_fallback_syscall
  356. mov r31 = r33 // r31 = result pointer expected by .gettime
  357. shl r30 = r32,15 // r30 = flags: bit 15 set only for CLOCK_MONOTONIC
  358. br.many .gettime
  359. END(fsys_clock_gettime)
  360. /*
  361. * long fsys_rt_sigprocmask (int how, sigset_t *set, sigset_t *oset, size_t sigsetsize).
  362. */
  363. #if _NSIG_WORDS != 1
  364. # error Sorry, fsys_rt_sigprocmask() needs to be updated for _NSIG_WORDS != 1.
  365. #endif
  /*
   * Register use on entry: r32 = how, r33 = set, r34 = oset, r35 = sigsetsize.
   *
   * Outcomes visible in this handler:
   *  - EINVAL (.fail_einval) if how > SIG_SETMASK, sigsetsize != _NSIG_WORDS*8,
   *    or r32/r35 is NaT.
   *  - EFAULT (.fail_efault) if r33 or r34 is NaT, or a user access faults.
   *  - fsys_fallback_syscall if a TIF_ALLWORK_MASK flag is set, if the siglock
   *    is already held (SMP), or if a signal would be pending under the new
   *    mask. In the last case the new mask has not been stored yet.
   *  - Otherwise: with set == NULL only the current mask is reported; with a
   *    non-NULL set the new mask (SIGKILL and SIGSTOP filtered out) is written
   *    to current->blocked with interrupts masked and, on SMP, the siglock
   *    held, and the TIF_SIGPENDING flag is cleared with a cmpxchg loop.
   *    If oset != NULL (p15) the previous mask in r3 is stored to *oset.
   *    r8 = 0 on return.
   *
   * The .fail_einval and .fail_efault labels live in fsys_gettimeofday.
   */
  366. ENTRY(fsys_rt_sigprocmask)
  367. .prologue
  368. .altrp b6
  369. .body
  370. add r2=IA64_TASK_BLOCKED_OFFSET,r16 // r2 = &current->blocked
  371. add r9=TI_FLAGS+IA64_TASK_SIZE,r16 // r9 = address of the thread-info flags word
  372. cmp4.ltu p6,p0=SIG_SETMASK,r32 // p6 = how > SIG_SETMASK (unsigned)
  373. cmp.ne p15,p0=r0,r34 // oset != NULL?
  374. tnat.nz p8,p0=r34 // p8 = oset register is NaT
  375. add r31=IA64_TASK_SIGHAND_OFFSET,r16 // r31 = &current->sighand
  376. ;;
  377. ld8 r3=[r2] // read/prefetch current->blocked
  378. ld4 r9=[r9] // r9 = thread-info flags
  379. tnat.nz.or p6,p0=r35 // p6 |= sigsetsize register is NaT
  380. cmp.ne.or p6,p0=_NSIG_WORDS*8,r35 // p6 |= sigsetsize has the wrong value
  381. tnat.nz.or p6,p0=r32 // p6 |= how register is NaT
  382. (p6) br.spnt.few .fail_einval // fail with EINVAL
  383. ;;
  384. #ifdef CONFIG_SMP
  385. ld8 r31=[r31] // r31 <- current->sighand
  386. #endif
  387. and r9=TIF_ALLWORK_MASK,r9 // keep only the pending-work bits
  388. tnat.nz.or p8,p0=r33 // p8 |= set register is NaT
  389. ;;
  390. cmp.ne p7,p0=0,r9 // p7 = at least one work flag is pending
  391. cmp.eq p6,p0=r0,r33 // set == NULL?
  392. add r31=IA64_SIGHAND_SIGLOCK_OFFSET,r31 // r31 <- current->sighand->siglock
  393. (p8) br.spnt.few .fail_efault // fail with EFAULT
  394. (p7) br.spnt.many fsys_fallback_syscall // got pending kernel work...
  395. (p6) br.dpnt.many .store_mask // -> short-circuit to just reading the signal mask
  396. /* Argh, we actually have to do some work and _update_ the signal mask: */
  397. EX(.fail_efault, probe.r.fault r33, 3) // verify user has read-access to *set
  398. EX(.fail_efault, ld8 r14=[r33]) // r14 <- *set
  399. mov r17=(1 << (SIGKILL - 1)) | (1 << (SIGSTOP - 1))
  400. ;;
  401. RSM_PSR_I(p0, r18, r19) // mask interrupt delivery
  402. mov ar.ccv=0 // cmpxchg below expects the lock word to be 0
  403. andcm r14=r14,r17 // filter out SIGKILL & SIGSTOP
  404. #ifdef CONFIG_SMP
  405. mov r17=1 // value written to the lock word when taking it
  406. ;;
  407. cmpxchg4.acq r18=[r31],r17,ar.ccv // try to acquire the lock
  408. mov r8=EINVAL // default to EINVAL
  409. ;;
  410. ld8 r3=[r2] // re-read current->blocked now that we hold the lock
  411. cmp4.ne p6,p0=r18,r0 // p6 = lock word was not 0, i.e. lock not acquired
  412. (p6) br.cond.spnt.many .lock_contention
  413. ;;
  414. #else
  415. ld8 r3=[r2] // re-read current->blocked now that we hold the lock
  416. mov r8=EINVAL // default to EINVAL
  417. #endif
  418. add r18=IA64_TASK_PENDING_OFFSET+IA64_SIGPENDING_SIGNAL_OFFSET,r16 // r18 = &current->pending.signal
  419. add r19=IA64_TASK_SIGNAL_OFFSET,r16 // r19 = &current->signal
  420. cmp4.eq p6,p0=SIG_BLOCK,r32
  421. ;;
  422. ld8 r19=[r19] // r19 <- current->signal
  423. cmp4.eq p7,p0=SIG_UNBLOCK,r32
  424. cmp4.eq p8,p0=SIG_SETMASK,r32
  425. ;;
  426. ld8 r18=[r18] // r18 <- current->pending.signal
  427. .pred.rel.mutex p6,p7,p8
  428. (p6) or r14=r3,r14 // SIG_BLOCK
  429. (p7) andcm r14=r3,r14 // SIG_UNBLOCK
  430. (p8) mov r14=r14 // SIG_SETMASK
  431. (p6) mov r8=0 // clear error code
  432. // recalc_sigpending()
  433. add r17=IA64_SIGNAL_GROUP_STOP_COUNT_OFFSET,r19
  434. add r19=IA64_SIGNAL_SHARED_PENDING_OFFSET+IA64_SIGPENDING_SIGNAL_OFFSET,r19
  435. ;;
  436. ld4 r17=[r17] // r17 <- current->signal->group_stop_count
  437. (p7) mov r8=0 // clear error code
  438. ld8 r19=[r19] // r19 <- current->signal->shared_pending
  439. ;;
  440. cmp4.gt p6,p7=r17,r0 // p6/p7 <- (current->signal->group_stop_count > 0)?
  441. (p8) mov r8=0 // clear error code
  442. or r18=r18,r19 // r18 <- current->pending | current->signal->shared_pending
  443. ;;
  444. // r18 <- (current->pending | current->signal->shared_pending) & ~current->blocked:
  445. andcm r18=r18,r14
  446. add r9=TI_FLAGS+IA64_TASK_SIZE,r16 // r9 = address of the thread-info flags word again
  447. ;;
  448. (p7) cmp.ne.or.andcm p6,p7=r18,r0 // p6/p7 <- signal pending
  449. mov r19=0 // i must not leak kernel bits...
  450. (p6) br.cond.dpnt.many .sig_pending
  451. ;;
  452. 1: ld4 r17=[r9] // r17 <- current->thread_info->flags
  453. ;;
  454. mov ar.ccv=r17 // cmpxchg below succeeds only if flags are unchanged
  455. and r18=~_TIF_SIGPENDING,r17 // r18 <- r17 & ~(1 << TIF_SIGPENDING)
  456. ;;
  457. st8 [r2]=r14 // update current->blocked with new mask
  458. cmpxchg4.acq r8=[r9],r18,ar.ccv // current->thread_info->flags <- r18
  459. ;;
  460. cmp.ne p6,p0=r17,r8 // update failed?
  461. (p6) br.cond.spnt.few 1b // yes -> retry
  462. #ifdef CONFIG_SMP
  463. st4.rel [r31]=r0 // release the lock
  464. #endif
  465. SSM_PSR_I(p0, p9, r31)
  466. ;;
  467. srlz.d // ensure psr.i is set again
  468. mov r18=0 // i must not leak kernel bits...
  469. .store_mask:
  470. EX(.fail_efault, (p15) probe.w.fault r34, 3) // verify user has write-access to *oset
  471. EX(.fail_efault, (p15) st8 [r34]=r3) // *oset <- mask read before the update
  472. mov r2=0 // i must not leak kernel bits...
  473. mov r3=0 // i must not leak kernel bits...
  474. mov r8=0 // return 0
  475. mov r9=0 // i must not leak kernel bits...
  476. mov r14=0 // i must not leak kernel bits...
  477. mov r17=0 // i must not leak kernel bits...
  478. mov r31=0 // i must not leak kernel bits...
  479. FSYS_RETURN
  480. .sig_pending:
  481. #ifdef CONFIG_SMP
  482. st4.rel [r31]=r0 // release the lock
  483. #endif
  484. SSM_PSR_I(p0, p9, r17)
  485. ;;
  486. srlz.d
  487. br.sptk.many fsys_fallback_syscall // with signal pending, do the heavy-weight syscall
  488. #ifdef CONFIG_SMP
  489. .lock_contention:
  490. /* Rather than spinning here, fall back on doing a heavy-weight syscall. */
  491. SSM_PSR_I(p0, p9, r17)
  492. ;;
  493. srlz.d
  494. br.sptk.many fsys_fallback_syscall
  495. #endif
  496. END(fsys_rt_sigprocmask)
  497. /*
  498. * fsys_getcpu doesn't use the third parameter in this implementation. It reads
  499. * current_thread_info()->cpu and corresponding node in cpu_to_node_map.
  500. */
  /*
   * In:  r32 = user pointer that receives the cpu number (4-byte store),
   *      r33 = user pointer that receives the node number (2-byte store).
   * Out: r8 = 0 on success. A NaT pointer register goes to .fail_einval and a
   *      faulting user access to .fail_efault (both labels live in
   *      fsys_gettimeofday). Pending TIF_ALLWORK_MASK work goes to
   *      fsys_fallback_syscall.
   *
   * With CONFIG_NUMA the node is loaded as a 2-byte entry from
   * cpu_to_node_map[cpu]; without it, zero is stored as the node.
   *
   * NOTE(review): both pointers are probed unconditionally, so a NULL cpu or
   * node pointer presumably ends in .fail_efault rather than being skipped.
   * Confirm what callers pass.
   * NOTE(review): the node is written with st2, i.e. only 16 bits of the
   * destination are updated. Confirm against the user-visible type of *node.
   */
  501. ENTRY(fsys_getcpu)
  502. .prologue
  503. .altrp b6
  504. .body
  505. ;;
  506. add r2=TI_FLAGS+IA64_TASK_SIZE,r16 // r2 = address of thread_info->flags
  507. tnat.nz p6,p0 = r32 // guard against NaT argument
  508. add r3=TI_CPU+IA64_TASK_SIZE,r16 // r3 = address of thread_info->cpu
  509. ;;
  510. ld4 r3=[r3] // M r3 = thread_info->cpu
  511. ld4 r2=[r2] // M r2 = thread_info->flags
  512. (p6) br.cond.spnt.few .fail_einval // B
  513. ;;
  514. tnat.nz p7,p0 = r33 // I guard against NaT argument
  515. (p7) br.cond.spnt.few .fail_einval // B
  516. #ifdef CONFIG_NUMA
  517. movl r17=cpu_to_node_map
  518. ;;
  519. EX(.fail_efault, probe.w.fault r32, 3) // M This takes 5 cycles
  520. EX(.fail_efault, probe.w.fault r33, 3) // M This takes 5 cycles
  521. shladd r18=r3,1,r17 // r18 = &cpu_to_node_map[cpu] (2-byte entries)
  522. ;;
  523. ld2 r20=[r18] // r20 = cpu_to_node_map[cpu]
  524. and r2 = TIF_ALLWORK_MASK,r2 // keep only the pending-work bits
  525. ;;
  526. cmp.ne p8,p0=0,r2 // p8 = at least one work flag is pending
  527. (p8) br.spnt.many fsys_fallback_syscall
  528. ;;
  529. ;;
  530. EX(.fail_efault, st4 [r32] = r3) // store the cpu number
  531. EX(.fail_efault, st2 [r33] = r20) // store the node number
  532. mov r8=0 // return 0
  533. ;;
  534. #else
  535. EX(.fail_efault, probe.w.fault r32, 3) // M This takes 5 cycles
  536. EX(.fail_efault, probe.w.fault r33, 3) // M This takes 5 cycles
  537. and r2 = TIF_ALLWORK_MASK,r2 // keep only the pending-work bits
  538. ;;
  539. cmp.ne p8,p0=0,r2 // p8 = at least one work flag is pending
  540. (p8) br.spnt.many fsys_fallback_syscall
  541. ;;
  542. EX(.fail_efault, st4 [r32] = r3) // store the cpu number
  543. EX(.fail_efault, st2 [r33] = r0) // no NUMA: the node is reported as 0
  544. mov r8=0 // return 0
  545. ;;
  546. #endif
  547. FSYS_RETURN
  548. END(fsys_getcpu)
  /*
   * fsys_fallback_syscall: common exit taken by the light-weight handlers when
   * they cannot finish the call themselves. It looks up the heavy-weight
   * entry point for syscall number r15 in sys_call_table, masks interrupts,
   * and loads the values that paravirt_fsys_bubble_down expects:
   *   r18 = syscall entry point, r21 = ar.fpsr, r26 = ar.pfs,
   *   r27 = ar.rsc, r29 = psr.
   * There is no return or branch at the end: execution continues directly
   * into paravirt_fsys_bubble_down, which follows this block.
   */
  549. ENTRY(fsys_fallback_syscall)
  550. .prologue
  551. .altrp b6
  552. .body
  553. /*
  554. * We only get here from light-weight syscall handlers. Thus, we already
  555. * know that r15 contains a valid syscall number. No need to re-check.
  556. */
  557. adds r17=-1024,r15 // r17 = syscall number - 1024 (table index)
  558. movl r14=sys_call_table
  559. ;;
  560. RSM_PSR_I(p0, r26, r27) // mask interrupt delivery
  561. shladd r18=r17,3,r14 // r18 = &sys_call_table[r17] (8-byte entries)
  562. ;;
  563. ld8 r18=[r18] // load normal (heavy-weight) syscall entry-point
  564. MOV_FROM_PSR(p0, r29, r26) // read psr (12 cyc load latency)
  565. mov r27=ar.rsc // r27 = ar.rsc, as expected by the bubble-down code
  566. mov r21=ar.fpsr // r21 = ar.fpsr, as expected by the bubble-down code
  567. mov r26=ar.pfs // r26 = ar.pfs, as expected by the bubble-down code
  568. END(fsys_fallback_syscall)
  569. /* FALL THROUGH */
  /*
   * paravirt_fsys_bubble_down: turn an fsyscall into a normal heavy-weight
   * system call. Steps visible below, in order:
   *   - r14 = ia64_ret_from_syscall (later copied to rp) and
   *     r28 = __kernel_syscall_via_break (value for cr.iip);
   *   - clear current->thread.on_ustack and save pr in r31;
   *   - save ar.bspstore/ar.rnat/ar.unat/b6/gp and switch ar.bspstore to the
   *     kernel register backing store at task + IA64_RBS_OFFSET;
   *   - OR PSR_ONE_BITS into r29 to build the cr.ipsr value;
   *   - point r1 at the pt_regs area and call ia64_syscall_setup;
   *   - optionally update the stime/utime accounting fields
   *     (CONFIG_VIRT_CPU_ACCOUNTING);
   *   - re-enable interrupts and call the handler through b6, or branch to
   *     ia64_trace_syscall when a _TIF_SYSCALL_TRACEAUDIT flag is set.
   */
  570. GLOBAL_ENTRY(paravirt_fsys_bubble_down)
  571. .prologue
  572. .altrp b6
  573. .body
  574. /*
  575. * We get here for syscalls that don't have a lightweight
  576. * handler. For those, we need to bubble down into the kernel
  577. * and that requires setting up a minimal pt_regs structure,
  578. * and initializing the CPU state more or less as if an
  579. * interruption had occurred. To make syscall-restarts work,
  580. * we setup pt_regs such that cr_iip points to the second
  581. * instruction in syscall_via_break. Decrementing the IP
  582. * hence will restart the syscall via break and not
  583. * decrementing IP will return us to the caller, as usual.
  584. * Note that we preserve the value of psr.pp rather than
  585. * initializing it from dcr.pp. This makes it possible to
  586. * distinguish fsyscall execution from other privileged
  587. * execution.
  588. *
  589. * On entry:
  590. * - normal fsyscall handler register usage, except
  591. * that we also have:
  592. * - r18: address of syscall entry point
  593. * - r21: ar.fpsr
  594. * - r26: ar.pfs
  595. * - r27: ar.rsc
  596. * - r29: psr
  597. *
  598. * We used to clear some PSR bits here but that requires slow
  599. * serialization. Fortunately, that isn't really necessary.
  600. * The rationale is as follows: we used to clear bits
  601. * ~PSR_PRESERVED_BITS in PSR.L. Since
  602. * PSR_PRESERVED_BITS==PSR.{UP,MFL,MFH,PK,DT,PP,SP,RT,IC}, we
  603. * ended up clearing PSR.{BE,AC,I,DFL,DFH,DI,DB,SI,TB}.
  604. * However,
  605. *
  606. * PSR.BE : already is turned off in __kernel_syscall_via_epc()
  607. * PSR.AC : don't care (kernel normally turns PSR.AC on)
  608. * PSR.I : already turned off by the time paravirt_fsys_bubble_down gets
  609. * invoked
  610. * PSR.DFL: always 0 (kernel never turns it on)
  611. * PSR.DFH: don't care --- kernel never touches f32-f127 on its own
  612. * initiative
  613. * PSR.DI : always 0 (kernel never turns it on)
  614. * PSR.SI : always 0 (kernel never turns it on)
  615. * PSR.DB : don't care --- kernel never enables kernel-level
  616. * breakpoints
  617. * PSR.TB : must be 0 already; if it wasn't zero on entry to
  618. * __kernel_syscall_via_epc, the branch to paravirt_fsys_bubble_down
  619. * will trigger a taken branch; the taken-trap-handler then
  620. * converts the syscall into a break-based system-call.
  621. */
  622. /*
  623. * Reading psr.l gives us only bits 0-31, psr.it, and psr.mc.
  624. * The rest we have to synthesize.
  625. */
  626. # define PSR_ONE_BITS ((3 << IA64_PSR_CPL0_BIT) \
  627. | (0x1 << IA64_PSR_RI_BIT) \
  628. | IA64_PSR_BN | IA64_PSR_I)
  629. invala // M0|1
  630. movl r14=ia64_ret_from_syscall // X
  631. nop.m 0
  632. movl r28=__kernel_syscall_via_break // X create cr.iip
  633. ;;
  634. mov r2=r16 // A get task addr to addl-addressable register
  635. adds r16=IA64_TASK_THREAD_ON_USTACK_OFFSET,r16 // A
  636. mov r31=pr // I0 save pr (2 cyc)
  637. ;;
  638. st1 [r16]=r0 // M2|3 clear current->thread.on_ustack flag
  639. addl r22=IA64_RBS_OFFSET,r2 // A compute base of RBS
  640. add r3=TI_FLAGS+IA64_TASK_SIZE,r2 // A
  641. ;;
  642. ld4 r3=[r3] // M0|1 r3 = current_thread_info()->flags
  643. lfetch.fault.excl.nt1 [r22] // M0|1 prefetch register backing-store
  644. nop.i 0
  645. ;;
  646. mov ar.rsc=0 // M2 set enforced lazy mode, pl 0, LE, loadrs=0
  647. #ifdef CONFIG_VIRT_CPU_ACCOUNTING
  648. MOV_FROM_ITC(p0, p6, r30, r23) // M get cycle for accounting
  649. #else
  650. nop.m 0
  651. #endif
  652. nop.i 0
  653. ;;
  654. mov r23=ar.bspstore // M2 (12 cyc) save ar.bspstore
  655. mov.m r24=ar.rnat // M2 (5 cyc) read ar.rnat (dual-issues!)
  656. nop.i 0
  657. ;;
  658. mov ar.bspstore=r22 // M2 (6 cyc) switch to kernel RBS
  659. movl r8=PSR_ONE_BITS // X
  660. ;;
  661. mov r25=ar.unat // M2 (5 cyc) save ar.unat
  662. mov r19=b6 // I0 save b6 (2 cyc)
  663. mov r20=r1 // A save caller's gp in r20
  664. ;;
  665. or r29=r8,r29 // A construct cr.ipsr value to save
  666. mov b6=r18 // I0 copy syscall entry-point to b6 (7 cyc)
  667. addl r1=IA64_STK_OFFSET-IA64_PT_REGS_SIZE,r2 // A compute base of memory stack
  668. mov r18=ar.bsp // M2 save (kernel) ar.bsp (12 cyc)
  669. cmp.ne pKStk,pUStk=r0,r0 // A set pKStk <- 0, pUStk <- 1
  670. br.call.sptk.many b7=ia64_syscall_setup // B
  671. ;;
  672. #ifdef CONFIG_VIRT_CPU_ACCOUNTING
  673. // mov.m r30=ar.itc is called in advance
  674. add r16=TI_AC_STAMP+IA64_TASK_SIZE,r2
  675. add r17=TI_AC_LEAVE+IA64_TASK_SIZE,r2
  676. ;;
  677. ld8 r18=[r16],TI_AC_STIME-TI_AC_STAMP // time at last check in kernel
  678. ld8 r19=[r17],TI_AC_UTIME-TI_AC_LEAVE // time at leave kernel
  679. ;;
  680. ld8 r20=[r16],TI_AC_STAMP-TI_AC_STIME // cumulated stime
  681. ld8 r21=[r17] // cumulated utime
  682. sub r22=r19,r18 // stime before leave kernel
  683. ;;
  684. st8 [r16]=r30,TI_AC_STIME-TI_AC_STAMP // update stamp
  685. sub r18=r30,r19 // elapsed time in user mode
  686. ;;
  687. add r20=r20,r22 // sum stime
  688. add r21=r21,r18 // sum utime
  689. ;;
  690. st8 [r16]=r20 // update stime
  691. st8 [r17]=r21 // update utime
  692. ;;
  693. #endif
  694. mov ar.rsc=0x3 // M2 set eager mode, pl 0, LE, loadrs=0
  695. mov rp=r14 // I0 set the real return addr
  696. and r3=_TIF_SYSCALL_TRACEAUDIT,r3 // A
  697. ;;
  698. SSM_PSR_I(p0, p6, r22) // M2 we're on kernel stacks now, reenable irqs
  699. cmp.eq p8,p0=r3,r0 // A
  700. (p10) br.cond.spnt.many ia64_ret_from_syscall // B return if bad call-frame or r15 is a NaT
  701. nop.m 0
  702. (p8) br.call.sptk.many b6=b6 // B (ignore return address)
  703. br.cond.spnt ia64_trace_syscall // B
  704. END(paravirt_fsys_bubble_down)
  705. .rodata
  706. .align 8
  707. .globl paravirt_fsyscall_table
  708. data8 paravirt_fsys_bubble_down
  709. paravirt_fsyscall_table:
  710. data8 fsys_ni_syscall
  711. data8 0 // exit // 1025
  712. data8 0 // read
  713. data8 0 // write
  714. data8 0 // open
  715. data8 0 // close
  716. data8 0 // creat // 1030
  717. data8 0 // link
  718. data8 0 // unlink
  719. data8 0 // execve
  720. data8 0 // chdir
  721. data8 0 // fchdir // 1035
  722. data8 0 // utimes
  723. data8 0 // mknod
  724. data8 0 // chmod
  725. data8 0 // chown
  726. data8 0 // lseek // 1040
  727. data8 fsys_getpid // getpid
  728. data8 fsys_getppid // getppid
  729. data8 0 // mount
  730. data8 0 // umount
  731. data8 0 // setuid // 1045
  732. data8 0 // getuid
  733. data8 0 // geteuid
  734. data8 0 // ptrace
  735. data8 0 // access
  736. data8 0 // sync // 1050
  737. data8 0 // fsync
  738. data8 0 // fdatasync
  739. data8 0 // kill
  740. data8 0 // rename
  741. data8 0 // mkdir // 1055
  742. data8 0 // rmdir
  743. data8 0 // dup
  744. data8 0 // pipe
  745. data8 0 // times
  746. data8 0 // brk // 1060
  747. data8 0 // setgid
  748. data8 0 // getgid
  749. data8 0 // getegid
  750. data8 0 // acct
  751. data8 0 // ioctl // 1065
  752. data8 0 // fcntl
  753. data8 0 // umask
  754. data8 0 // chroot
  755. data8 0 // ustat
  756. data8 0 // dup2 // 1070
  757. data8 0 // setreuid
  758. data8 0 // setregid
  759. data8 0 // getresuid
  760. data8 0 // setresuid
  761. data8 0 // getresgid // 1075
  762. data8 0 // setresgid
  763. data8 0 // getgroups
  764. data8 0 // setgroups
  765. data8 0 // getpgid
  766. data8 0 // setpgid // 1080
  767. data8 0 // setsid
  768. data8 0 // getsid
  769. data8 0 // sethostname
  770. data8 0 // setrlimit
  771. data8 0 // getrlimit // 1085
  772. data8 0 // getrusage
  773. data8 fsys_gettimeofday // gettimeofday
  774. data8 0 // settimeofday
  775. data8 0 // select
  776. data8 0 // poll // 1090
  777. data8 0 // symlink
  778. data8 0 // readlink
  779. data8 0 // uselib
  780. data8 0 // swapon
  781. data8 0 // swapoff // 1095
  782. data8 0 // reboot
  783. data8 0 // truncate
  784. data8 0 // ftruncate
  785. data8 0 // fchmod
  786. data8 0 // fchown // 1100
  787. data8 0 // getpriority
  788. data8 0 // setpriority
  789. data8 0 // statfs
  790. data8 0 // fstatfs
  791. data8 0 // gettid // 1105
  792. data8 0 // semget
  793. data8 0 // semop
  794. data8 0 // semctl
  795. data8 0 // msgget
  796. data8 0 // msgsnd // 1110
  797. data8 0 // msgrcv
  798. data8 0 // msgctl
  799. data8 0 // shmget
  800. data8 0 // shmat
  801. data8 0 // shmdt // 1115
  802. data8 0 // shmctl
  803. data8 0 // syslog
  804. data8 0 // setitimer
  805. data8 0 // getitimer
  806. data8 0 // 1120
  807. data8 0
  808. data8 0
  809. data8 0 // vhangup
  810. data8 0 // lchown
  811. data8 0 // remap_file_pages // 1125
  812. data8 0 // wait4
  813. data8 0 // sysinfo
  814. data8 0 // clone
  815. data8 0 // setdomainname
  816. data8 0 // newuname // 1130
  817. data8 0 // adjtimex
  818. data8 0
  819. data8 0 // init_module
  820. data8 0 // delete_module
  821. data8 0 // 1135
  822. data8 0
  823. data8 0 // quotactl
  824. data8 0 // bdflush
  825. data8 0 // sysfs
  826. data8 0 // personality // 1140
  827. data8 0 // afs_syscall
  828. data8 0 // setfsuid
  829. data8 0 // setfsgid
  830. data8 0 // getdents
  831. data8 0 // flock // 1145
  832. data8 0 // readv
  833. data8 0 // writev
  834. data8 0 // pread64
  835. data8 0 // pwrite64
  836. data8 0 // sysctl // 1150
  837. data8 0 // mmap
  838. data8 0 // munmap
  839. data8 0 // mlock
  840. data8 0 // mlockall
  841. data8 0 // mprotect // 1155
  842. data8 0 // mremap
  843. data8 0 // msync
  844. data8 0 // munlock
  845. data8 0 // munlockall
  846. data8 0 // sched_getparam // 1160
  847. data8 0 // sched_setparam
  848. data8 0 // sched_getscheduler
  849. data8 0 // sched_setscheduler
  850. data8 0 // sched_yield
  851. data8 0 // sched_get_priority_max // 1165
  852. data8 0 // sched_get_priority_min
  853. data8 0 // sched_rr_get_interval
  854. data8 0 // nanosleep
  855. data8 0 // nfsservctl
  856. data8 0 // prctl // 1170
  857. data8 0 // getpagesize
  858. data8 0 // mmap2
  859. data8 0 // pciconfig_read
  860. data8 0 // pciconfig_write
  861. data8 0 // perfmonctl // 1175
  862. data8 0 // sigaltstack
  863. data8 0 // rt_sigaction
  864. data8 0 // rt_sigpending
  865. data8 fsys_rt_sigprocmask // rt_sigprocmask
  866. data8 0 // rt_sigqueueinfo // 1180
  867. data8 0 // rt_sigreturn
  868. data8 0 // rt_sigsuspend
  869. data8 0 // rt_sigtimedwait
  870. data8 0 // getcwd
  871. data8 0 // capget // 1185
  872. data8 0 // capset
  873. data8 0 // sendfile
  874. data8 0
  875. data8 0
  876. data8 0 // socket // 1190
  877. data8 0 // bind
  878. data8 0 // connect
  879. data8 0 // listen
  880. data8 0 // accept
  881. data8 0 // getsockname // 1195
  882. data8 0 // getpeername
  883. data8 0 // socketpair
  884. data8 0 // send
  885. data8 0 // sendto
  886. data8 0 // recv // 1200
  887. data8 0 // recvfrom
  888. data8 0 // shutdown
  889. data8 0 // setsockopt
  890. data8 0 // getsockopt
  891. data8 0 // sendmsg // 1205
  892. data8 0 // recvmsg
  893. data8 0 // pivot_root
  894. data8 0 // mincore
  895. data8 0 // madvise
  896. data8 0 // newstat // 1210
  897. data8 0 // newlstat
  898. data8 0 // newfstat
  899. data8 0 // clone2
  900. data8 0 // getdents64
  901. data8 0 // getunwind // 1215
  902. data8 0 // readahead
  903. data8 0 // setxattr
  904. data8 0 // lsetxattr
  905. data8 0 // fsetxattr
  906. data8 0 // getxattr // 1220
  907. data8 0 // lgetxattr
  908. data8 0 // fgetxattr
  909. data8 0 // listxattr
  910. data8 0 // llistxattr
  911. data8 0 // flistxattr // 1225
  912. data8 0 // removexattr
  913. data8 0 // lremovexattr
  914. data8 0 // fremovexattr
  915. data8 0 // tkill
  916. data8 0 // futex // 1230
  917. data8 0 // sched_setaffinity
  918. data8 0 // sched_getaffinity
  919. data8 fsys_set_tid_address // set_tid_address
  920. data8 0 // fadvise64_64
  921. data8 0 // tgkill // 1235
  922. data8 0 // exit_group
  923. data8 0 // lookup_dcookie
  924. data8 0 // io_setup
  925. data8 0 // io_destroy
  926. data8 0 // io_getevents // 1240
  927. data8 0 // io_submit
  928. data8 0 // io_cancel
  929. data8 0 // epoll_create
  930. data8 0 // epoll_ctl
  931. data8 0 // epoll_wait // 1245
  932. data8 0 // restart_syscall
  933. data8 0 // semtimedop
  934. data8 0 // timer_create
  935. data8 0 // timer_settime
  936. data8 0 // timer_gettime // 1250
  937. data8 0 // timer_getoverrun
  938. data8 0 // timer_delete
  939. data8 0 // clock_settime
  940. data8 fsys_clock_gettime // clock_gettime
  941. data8 0 // clock_getres // 1255
  942. data8 0 // clock_nanosleep
  943. data8 0 // fstatfs64
  944. data8 0 // statfs64
  945. data8 0 // mbind
  946. data8 0 // get_mempolicy // 1260
  947. data8 0 // set_mempolicy
  948. data8 0 // mq_open
  949. data8 0 // mq_unlink
  950. data8 0 // mq_timedsend
  951. data8 0 // mq_timedreceive // 1265
  952. data8 0 // mq_notify
  953. data8 0 // mq_getsetattr
  954. data8 0 // kexec_load
  955. data8 0 // vserver
  956. data8 0 // waitid // 1270
  957. data8 0 // add_key
  958. data8 0 // request_key
  959. data8 0 // keyctl
  960. data8 0 // ioprio_set
  961. data8 0 // ioprio_get // 1275
  962. data8 0 // move_pages
  963. data8 0 // inotify_init
  964. data8 0 // inotify_add_watch
  965. data8 0 // inotify_rm_watch
  966. data8 0 // migrate_pages // 1280
  967. data8 0 // openat
  968. data8 0 // mkdirat
  969. data8 0 // mknodat
  970. data8 0 // fchownat
  971. data8 0 // futimesat // 1285
  972. data8 0 // newfstatat
  973. data8 0 // unlinkat
  974. data8 0 // renameat
  975. data8 0 // linkat
  976. data8 0 // symlinkat // 1290
  977. data8 0 // readlinkat
  978. data8 0 // fchmodat
  979. data8 0 // faccessat
  980. data8 0
  981. data8 0 // 1295
  982. data8 0 // unshare
  983. data8 0 // splice
  984. data8 0 // set_robust_list
  985. data8 0 // get_robust_list
  986. data8 0 // sync_file_range // 1300
  987. data8 0 // tee
  988. data8 0 // vmsplice
  989. data8 0
  990. data8 fsys_getcpu // getcpu // 1304
  991. // fill in zeros for the remaining entries: pad from the last explicit data8 slot above up to 8*NR_syscalls bytes past paravirt_fsyscall_table
  992. .zero: // address of the first byte after the explicit entries; used only to compute the pad size below
  993. .space paravirt_fsyscall_table + 8*NR_syscalls - .zero, 0 // size = (table base + 8*NR_syscalls) - .zero, fill byte = 0; NOTE(review): assumes paravirt_fsyscall_table labels the first slot of this table (defined above this chunk) -- confirm