#ifndef _PARISC_BITOPS_H
#define _PARISC_BITOPS_H

#include <linux/compiler.h>
#include <asm/types.h>		/* for BITS_PER_LONG/SHIFT_PER_LONG */
#include <asm/byteorder.h>
#include <asm/atomic.h>

/*
 * HP-PARISC specific bit operations.
 * For a detailed description of the functions, please refer
 * to include/asm-i386/bitops.h or the kerneldoc.
 */

#define CHOP_SHIFTCOUNT(x) (((unsigned long) (x)) & (BITS_PER_LONG - 1))
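
/*
 * Worked example (illustrative): a bit number decomposes into a word
 * index and an in-word shift. With BITS_PER_LONG == 64 (SHIFT_PER_LONG
 * == 6), bit 65 of a bitmap lives in word 65 >> 6 == 1 at in-word
 * position CHOP_SHIFTCOUNT(65) == 65 & 63 == 1; on a 32-bit kernel it
 * is word 65 >> 5 == 2, position 65 & 31 == 1.
 */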
#define smp_mb__before_clear_bit()	smp_mb()
#define smp_mb__after_clear_bit()	smp_mb()

/* See http://marc.theaimsgroup.com/?t=108826637900003 for discussion
 * on the use of volatile and __*_bit() (set/clear/change):
 * *_bit() want the use of volatile.
 * __*_bit() are "relaxed" and don't use spinlocks or volatile.
 */
static __inline__ void set_bit(int nr, volatile unsigned long * addr)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long flags;

	addr += (nr >> SHIFT_PER_LONG);
	_atomic_spin_lock_irqsave(addr, flags);
	*addr |= mask;
	_atomic_spin_unlock_irqrestore(addr, flags);
}

static __inline__ void __set_bit(unsigned long nr, volatile unsigned long * addr)
{
	unsigned long *m = (unsigned long *) addr + (nr >> SHIFT_PER_LONG);

	*m |= 1UL << CHOP_SHIFTCOUNT(nr);
}
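
/*
 * Usage sketch (illustrative only; the bitmap and bit number below are
 * hypothetical): set_bit() is safe against concurrent callers, while
 * __set_bit() is only correct when the caller already serializes all
 * access to the word.
 *
 *	static unsigned long pending[4];
 *
 *	set_bit(5, pending);	// e.g. interrupt vs. process context
 *	__set_bit(5, pending);	// only under an external lock
 */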
static __inline__ void clear_bit(int nr, volatile unsigned long * addr)
{
	unsigned long mask = ~(1UL << CHOP_SHIFTCOUNT(nr));
	unsigned long flags;

	addr += (nr >> SHIFT_PER_LONG);
	_atomic_spin_lock_irqsave(addr, flags);
	*addr &= mask;
	_atomic_spin_unlock_irqrestore(addr, flags);
}

static __inline__ void __clear_bit(unsigned long nr, volatile unsigned long * addr)
{
	unsigned long *m = (unsigned long *) addr + (nr >> SHIFT_PER_LONG);

	*m &= ~(1UL << CHOP_SHIFTCOUNT(nr));
}

static __inline__ void change_bit(int nr, volatile unsigned long * addr)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long flags;

	addr += (nr >> SHIFT_PER_LONG);
	_atomic_spin_lock_irqsave(addr, flags);
	*addr ^= mask;
	_atomic_spin_unlock_irqrestore(addr, flags);
}

static __inline__ void __change_bit(unsigned long nr, volatile unsigned long * addr)
{
	unsigned long *m = (unsigned long *) addr + (nr >> SHIFT_PER_LONG);

	*m ^= 1UL << CHOP_SHIFTCOUNT(nr);
}
static __inline__ int test_and_set_bit(int nr, volatile unsigned long * addr)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long oldbit;
	unsigned long flags;

	addr += (nr >> SHIFT_PER_LONG);
	_atomic_spin_lock_irqsave(addr, flags);
	oldbit = *addr;
	*addr = oldbit | mask;
	_atomic_spin_unlock_irqrestore(addr, flags);

	return (oldbit & mask) ? 1 : 0;
}

static __inline__ int __test_and_set_bit(int nr, volatile unsigned long * address)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long oldbit;
	unsigned long *addr = (unsigned long *)address + (nr >> SHIFT_PER_LONG);

	oldbit = *addr;
	*addr = oldbit | mask;

	return (oldbit & mask) ? 1 : 0;
}

static __inline__ int test_and_clear_bit(int nr, volatile unsigned long * addr)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long oldbit;
	unsigned long flags;

	addr += (nr >> SHIFT_PER_LONG);
	_atomic_spin_lock_irqsave(addr, flags);
	oldbit = *addr;
	*addr = oldbit & ~mask;
	_atomic_spin_unlock_irqrestore(addr, flags);

	return (oldbit & mask) ? 1 : 0;
}

static __inline__ int __test_and_clear_bit(int nr, volatile unsigned long * address)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long *addr = (unsigned long *)address + (nr >> SHIFT_PER_LONG);
	unsigned long oldbit;

	oldbit = *addr;
	*addr = oldbit & ~mask;

	return (oldbit & mask) ? 1 : 0;
}

static __inline__ int test_and_change_bit(int nr, volatile unsigned long * addr)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long oldbit;
	unsigned long flags;

	addr += (nr >> SHIFT_PER_LONG);
	_atomic_spin_lock_irqsave(addr, flags);
	oldbit = *addr;
	*addr = oldbit ^ mask;
	_atomic_spin_unlock_irqrestore(addr, flags);

	return (oldbit & mask) ? 1 : 0;
}

static __inline__ int __test_and_change_bit(int nr, volatile unsigned long * address)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	unsigned long *addr = (unsigned long *)address + (nr >> SHIFT_PER_LONG);
	unsigned long oldbit;

	oldbit = *addr;
	*addr = oldbit ^ mask;

	return (oldbit & mask) ? 1 : 0;
}

static __inline__ int test_bit(int nr, const volatile unsigned long *address)
{
	unsigned long mask = 1UL << CHOP_SHIFTCOUNT(nr);
	const unsigned long *addr = (const unsigned long *)address + (nr >> SHIFT_PER_LONG);

	return !!(*addr & mask);
}
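
/*
 * Usage sketch (illustrative; the flag word and bit number are
 * hypothetical): the atomic read-modify-write variants are the usual
 * way to claim something exactly once across CPUs.
 *
 *	static unsigned long state;
 *
 *	if (!test_and_set_bit(0, &state))
 *		do_setup();	// hypothetical; runs on exactly one CPU
 */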
#ifdef __KERNEL__

/**
 * __ffs - find first set bit in word. Returns 0 to BITS_PER_LONG-1.
 * @word: The word to search
 *
 * __ffs() return is undefined if no bit is set.
 *
 * 32-bit fast __ffs by LaMont Jones "lamont At hp com".
 * 64-bit enhancement by Grant Grundler "grundler At parisc-linux org".
 * (with help from willy/jejb to get the semantics right)
 *
 * This algorithm avoids branches by making use of nullification.
 * One side effect of "extr" instructions is that they set the PSW[N]
 * bit. How PSW[N] (nullify next insn) gets set is determined by the
 * "condition" field (eg "<>" or "TR" below) in the extr* insn.
 * Only the 1st and one of either the 2nd or 3rd insn will get executed.
 * Each set of 3 insns executes in 2 cycles on PA8x00, vs 16 or so
 * cycles for each mispredicted branch.
 */
static __inline__ unsigned long __ffs(unsigned long x)
{
	unsigned long ret;

	__asm__(
#ifdef __LP64__
	"	ldi		63,%1\n"
	"	extrd,u,*<>	%0,63,32,%%r0\n"
	"	extrd,u,*TR	%0,31,32,%0\n"	/* move top 32-bits down */
	"	addi		-32,%1,%1\n"
#else
	"	ldi		31,%1\n"
#endif
	"	extru,<>	%0,31,16,%%r0\n"
	"	extru,TR	%0,15,16,%0\n"	/* xxxx0000 -> 0000xxxx */
	"	addi		-16,%1,%1\n"
	"	extru,<>	%0,31,8,%%r0\n"
	"	extru,TR	%0,23,8,%0\n"	/* 0000xx00 -> 000000xx */
	"	addi		-8,%1,%1\n"
	"	extru,<>	%0,31,4,%%r0\n"
	"	extru,TR	%0,27,4,%0\n"	/* 000000x0 -> 0000000x */
	"	addi		-4,%1,%1\n"
	"	extru,<>	%0,31,2,%%r0\n"
	"	extru,TR	%0,29,2,%0\n"	/* 0000000y, 1100b -> 0011b */
	"	addi		-2,%1,%1\n"
	"	extru,=		%0,31,1,%%r0\n"	/* check last bit */
	"	addi		-1,%1,%1\n"
		: "+r" (x), "=r" (ret) );
	return ret;
}
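
/*
 * Worked examples (illustrative): each extr/addi triple halves the
 * search window, so the count in %1 converges on the index of the
 * least significant set bit:
 *
 *	__ffs(1)    == 0
 *	__ffs(0x10) == 4
 *	__ffs(1UL << (BITS_PER_LONG - 1)) == BITS_PER_LONG - 1
 */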
/* Undefined if no bit is zero. */
#define ffz(x) __ffs(~(x))
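
/*
 * Worked examples (illustrative): ffz() simply searches the complement,
 * so ffz(0) == 0, ffz(1) == 1 and ffz(0xff) == 8. Like __ffs(), it is
 * undefined when no qualifying (here: zero) bit exists, i.e. for ~0UL.
 */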
/*
 * ffs: find first bit set. Returns 1 to BITS_PER_LONG, or 0 if no bit
 * is set. This is defined the same way as the libc and compiler builtin
 * ffs routines, and therefore differs in spirit from the above ffz (man ffs).
 */
static __inline__ int ffs(int x)
{
	return x ? (__ffs((unsigned long)x) + 1) : 0;
}
/*
 * fls: find last (most significant) bit set.
 * fls(0) = 0, fls(1) = 1, fls(0x80000000) = 32.
 */
static __inline__ int fls(int x)
{
	int ret;

	if (!x)
		return 0;

	__asm__(
	"	ldi		1,%1\n"
	"	extru,<>	%0,15,16,%%r0\n"
	"	zdep,TR		%0,15,16,%0\n"	/* xxxx0000 */
	"	addi		16,%1,%1\n"
	"	extru,<>	%0,7,8,%%r0\n"
	"	zdep,TR		%0,23,24,%0\n"	/* xx000000 */
	"	addi		8,%1,%1\n"
	"	extru,<>	%0,3,4,%%r0\n"
	"	zdep,TR		%0,27,28,%0\n"	/* x0000000 */
	"	addi		4,%1,%1\n"
	"	extru,<>	%0,1,2,%%r0\n"
	"	zdep,TR		%0,29,30,%0\n"	/* y0000000 (y&3 = 0) */
	"	addi		2,%1,%1\n"
	"	extru,=		%0,0,1,%%r0\n"
	"	addi		1,%1,%1\n"	/* if y & 8, add 1 */
		: "+r" (x), "=r" (ret) );
	return ret;
}
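
/*
 * Worked examples (illustrative): ffs() reports the lowest set bit and
 * fls() the highest, both 1-based, with 0 meaning "no bit set":
 *
 *	ffs(0x18) == 4,  fls(0x18) == 5
 *	ffs(0)    == 0,  fls(0)    == 0
 */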
#define fls64(x) generic_fls64(x)

/*
 * hweightN: returns the hamming weight (i.e. the number
 * of bits set) of an N-bit word
 */
#define hweight64(x) generic_hweight64(x)
#define hweight32(x) generic_hweight32(x)
#define hweight16(x) generic_hweight16(x)
#define hweight8(x) generic_hweight8(x)
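
/*
 * Worked example (illustrative): the hamming weight is a population
 * count, e.g. hweight32(0xf0f0f0f0) == 16 and hweight8(0x5) == 2.
 */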
/*
 * Every architecture must define this function. It's the fastest
 * way of searching a 140-bit bitmap where the first 100 bits are
 * unlikely to be set. It's guaranteed that at least one of the 140
 * bits is set.
 */
static inline int sched_find_first_bit(const unsigned long *b)
{
#ifdef __LP64__
	if (unlikely(b[0]))
		return __ffs(b[0]);
	if (unlikely(b[1]))
		return __ffs(b[1]) + 64;
	return __ffs(b[2]) + 128;
#else
	if (unlikely(b[0]))
		return __ffs(b[0]);
	if (unlikely(b[1]))
		return __ffs(b[1]) + 32;
	if (unlikely(b[2]))
		return __ffs(b[2]) + 64;
	if (b[3])
		return __ffs(b[3]) + 96;
	return __ffs(b[4]) + 128;
#endif
}
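
/*
 * Layout sketch (illustrative): 140 bits occupy five 32-bit words or
 * three 64-bit words, so the unrolled scan above touches at most 5
 * (resp. 3) words. E.g. with only bit 100 set on a 32-bit kernel,
 * b[0]..b[2] are zero and b[3] has bit 4 set, so the result is
 * __ffs(b[3]) + 96 == 100.
 */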
#endif /* __KERNEL__ */

/*
 * This implementation of find_{first,next}_zero_bit was stolen from
 * Linus' asm-alpha/bitops.h.
 */
#define find_first_zero_bit(addr, size) \
	find_next_zero_bit((addr), (size), 0)
static __inline__ unsigned long find_next_zero_bit(const void * addr, unsigned long size, unsigned long offset)
{
	const unsigned long * p = ((unsigned long *) addr) + (offset >> SHIFT_PER_LONG);
	unsigned long result = offset & ~(BITS_PER_LONG-1);
	unsigned long tmp;

	if (offset >= size)
		return size;
	size -= result;
	offset &= (BITS_PER_LONG-1);
	if (offset) {
		tmp = *(p++);
		tmp |= ~0UL >> (BITS_PER_LONG-offset);
		if (size < BITS_PER_LONG)
			goto found_first;
		if (~tmp)
			goto found_middle;
		size -= BITS_PER_LONG;
		result += BITS_PER_LONG;
	}
	while (size & ~(BITS_PER_LONG-1)) {
		if (~(tmp = *(p++)))
			goto found_middle;
		result += BITS_PER_LONG;
		size -= BITS_PER_LONG;
	}
	if (!size)
		return result;
	tmp = *p;
found_first:
	tmp |= ~0UL << size;
found_middle:
	return result + ffz(tmp);
}
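
/*
 * Usage sketch (illustrative; the names map and nbits are hypothetical):
 * the conventional scan loop over zero bits. Once the last zero bit has
 * been handled, the next call starts at or past nbits and returns nbits,
 * which ends the loop.
 *
 *	unsigned long bit;
 *
 *	for (bit = find_first_zero_bit(map, nbits);
 *	     bit < nbits;
 *	     bit = find_next_zero_bit(map, nbits, bit + 1))
 *		claim_free_slot(bit);	// hypothetical consumer
 */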
static __inline__ unsigned long find_next_bit(const unsigned long *addr, unsigned long size, unsigned long offset)
{
	const unsigned long *p = addr + (offset >> SHIFT_PER_LONG);
	unsigned long result = offset & ~(BITS_PER_LONG-1);
	unsigned long tmp;

	if (offset >= size)
		return size;
	size -= result;
	offset &= (BITS_PER_LONG-1);
	if (offset) {
		tmp = *(p++);
		tmp &= (~0UL << offset);
		if (size < BITS_PER_LONG)
			goto found_first;
		if (tmp)
			goto found_middle;
		size -= BITS_PER_LONG;
		result += BITS_PER_LONG;
	}
	while (size & ~(BITS_PER_LONG-1)) {
		if ((tmp = *(p++)))
			goto found_middle;
		result += BITS_PER_LONG;
		size -= BITS_PER_LONG;
	}
	if (!size)
		return result;
	tmp = *p;
found_first:
	tmp &= (~0UL >> (BITS_PER_LONG - size));
	if (tmp == 0UL)			/* Are any bits set? */
		return result + size;	/* Nope. */
found_middle:
	return result + __ffs(tmp);
}
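
/*
 * Usage sketch (illustrative; map and nbits are hypothetical): the
 * matching loop over set bits. Unlike find_next_zero_bit() above, this
 * routine explicitly returns the full size when no set bit remains, so
 * comparing against nbits is always safe.
 *
 *	for (bit = find_next_bit(map, nbits, 0);
 *	     bit < nbits;
 *	     bit = find_next_bit(map, nbits, bit + 1))
 *		handle_set_bit(bit);	// hypothetical consumer
 */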
/**
 * find_first_bit - find the first set bit in a memory region
 * @addr: The address to start the search at
 * @size: The maximum size to search
 *
 * Returns the bit-number of the first set bit, not the number of the byte
 * containing a bit.
 */
#define find_first_bit(addr, size) \
	find_next_bit((addr), (size), 0)

#define _EXT2_HAVE_ASM_BITOPS_
#ifdef __KERNEL__
/*
 * test_and_{set,clear}_bit guarantee atomicity without
 * disabling interrupts.
 */

/* the shift count 3 is log2(bits per byte): it converts bytes to bits */
#define LE_BYTE_ADDR ((sizeof(unsigned long) - 1) << 3)

#define ext2_test_bit(nr, addr) \
		test_bit((nr) ^ LE_BYTE_ADDR, (unsigned long *)addr)
#define ext2_set_bit(nr, addr) \
		__test_and_set_bit((nr) ^ LE_BYTE_ADDR, (unsigned long *)addr)
#define ext2_clear_bit(nr, addr) \
		__test_and_clear_bit((nr) ^ LE_BYTE_ADDR, (unsigned long *)addr)

#define ext2_set_bit_atomic(l,nr,addr) \
		test_and_set_bit((nr) ^ LE_BYTE_ADDR, (unsigned long *)addr)
#define ext2_clear_bit_atomic(l,nr,addr) \
		test_and_clear_bit((nr) ^ LE_BYTE_ADDR, (unsigned long *)addr)

#endif /* __KERNEL__ */
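
/*
 * Worked example (illustrative): ext2 bitmaps are little-endian, so on
 * this big-endian machine the XOR with LE_BYTE_ADDR re-maps the byte
 * index within each word while keeping the bit-within-byte position.
 * On a 32-bit kernel LE_BYTE_ADDR == 24, so ext2 bit 0 (the LSB of the
 * first byte on disk) becomes generic bit 0 ^ 24 == 24, i.e. the low
 * bit of the most significant byte of the big-endian word. On a 64-bit
 * kernel LE_BYTE_ADDR == 56.
 */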
#define ext2_find_first_zero_bit(addr, size) \
	ext2_find_next_zero_bit((addr), (size), 0)

/* include/linux/byteorder does not support "unsigned long" type */
static inline unsigned long ext2_swabp(unsigned long * x)
{
#ifdef __LP64__
	return (unsigned long) __swab64p((u64 *) x);
#else
	return (unsigned long) __swab32p((u32 *) x);
#endif
}

/* include/linux/byteorder doesn't support "unsigned long" type */
static inline unsigned long ext2_swab(unsigned long y)
{
#ifdef __LP64__
	return (unsigned long) __swab64((u64) y);
#else
	return (unsigned long) __swab32((u32) y);
#endif
}
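
/*
 * Worked example (illustrative): the swab helpers reverse the byte
 * order of a full word, e.g. __swab32(0x12345678) == 0x78563412. This
 * turns an on-disk little-endian word into host (big-endian) order so
 * the generic ffz() bit numbering applies to it.
 */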
static __inline__ unsigned long ext2_find_next_zero_bit(void *addr, unsigned long size, unsigned long offset)
{
	unsigned long *p = (unsigned long *) addr + (offset >> SHIFT_PER_LONG);
	unsigned long result = offset & ~(BITS_PER_LONG - 1);
	unsigned long tmp;

	if (offset >= size)
		return size;
	size -= result;
	offset &= (BITS_PER_LONG - 1UL);
	if (offset) {
		tmp = ext2_swabp(p++);
		tmp |= (~0UL >> (BITS_PER_LONG - offset));
		if (size < BITS_PER_LONG)
			goto found_first;
		if (~tmp)
			goto found_middle;
		size -= BITS_PER_LONG;
		result += BITS_PER_LONG;
	}

	while (size & ~(BITS_PER_LONG - 1)) {
		if (~(tmp = *(p++)))
			goto found_middle_swap;
		result += BITS_PER_LONG;
		size -= BITS_PER_LONG;
	}
	if (!size)
		return result;
	tmp = ext2_swabp(p);
found_first:
	tmp |= ~0UL << size;
	if (tmp == ~0UL)		/* Are any bits zero? */
		return result + size;	/* Nope. Skip ffz */
found_middle:
	return result + ffz(tmp);

found_middle_swap:
	return result + ffz(ext2_swab(tmp));
}
/* Bitmap functions for the minix filesystem. */
#define minix_test_and_set_bit(nr,addr) ext2_set_bit(nr,addr)
#define minix_set_bit(nr,addr) ((void)ext2_set_bit(nr,addr))
#define minix_test_and_clear_bit(nr,addr) ext2_clear_bit(nr,addr)
#define minix_test_bit(nr,addr) ext2_test_bit(nr,addr)
#define minix_find_first_zero_bit(addr,size) ext2_find_first_zero_bit(addr,size)

#endif /* _PARISC_BITOPS_H */