raid6mmx.c 4.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150
  1. /* -*- linux-c -*- ------------------------------------------------------- *
  2. *
  3. * Copyright 2002 H. Peter Anvin - All Rights Reserved
  4. *
  5. * This program is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU General Public License as published by
  7. * the Free Software Foundation, Inc., 53 Temple Place Ste 330,
  8. * Bostom MA 02111-1307, USA; either version 2 of the License, or
  9. * (at your option) any later version; incorporated herein by reference.
  10. *
  11. * ----------------------------------------------------------------------- */
  12. /*
  13. * raid6mmx.c
  14. *
  15. * MMX implementation of RAID-6 syndrome functions
  16. */
  17. #if defined(__i386__)
  18. #include "raid6.h"
  19. #include "raid6x86.h"
  20. /* Shared with raid6sse1.c */
  21. const struct raid6_mmx_constants {
  22. u64 x1d;
  23. } raid6_mmx_constants = {
  24. 0x1d1d1d1d1d1d1d1dULL,
  25. };
  26. static int raid6_have_mmx(void)
  27. {
  28. #ifdef __KERNEL__
  29. /* Not really "boot_cpu" but "all_cpus" */
  30. return boot_cpu_has(X86_FEATURE_MMX);
  31. #else
  32. /* User space test code */
  33. u32 features = cpuid_features();
  34. return ( (features & (1<<23)) == (1<<23) );
  35. #endif
  36. }
  37. /*
  38. * Plain MMX implementation
  39. */
  40. static void raid6_mmx1_gen_syndrome(int disks, size_t bytes, void **ptrs)
  41. {
  42. u8 **dptr = (u8 **)ptrs;
  43. u8 *p, *q;
  44. int d, z, z0;
  45. raid6_mmx_save_t sa;
  46. z0 = disks - 3; /* Highest data disk */
  47. p = dptr[z0+1]; /* XOR parity */
  48. q = dptr[z0+2]; /* RS syndrome */
  49. raid6_before_mmx(&sa);
  50. asm volatile("movq %0,%%mm0" : : "m" (raid6_mmx_constants.x1d));
  51. asm volatile("pxor %mm5,%mm5"); /* Zero temp */
  52. for ( d = 0 ; d < bytes ; d += 8 ) {
  53. asm volatile("movq %0,%%mm2" : : "m" (dptr[z0][d])); /* P[0] */
  54. asm volatile("movq %mm2,%mm4"); /* Q[0] */
  55. for ( z = z0-1 ; z >= 0 ; z-- ) {
  56. asm volatile("movq %0,%%mm6" : : "m" (dptr[z][d]));
  57. asm volatile("pcmpgtb %mm4,%mm5");
  58. asm volatile("paddb %mm4,%mm4");
  59. asm volatile("pand %mm0,%mm5");
  60. asm volatile("pxor %mm5,%mm4");
  61. asm volatile("pxor %mm5,%mm5");
  62. asm volatile("pxor %mm6,%mm2");
  63. asm volatile("pxor %mm6,%mm4");
  64. }
  65. asm volatile("movq %%mm2,%0" : "=m" (p[d]));
  66. asm volatile("pxor %mm2,%mm2");
  67. asm volatile("movq %%mm4,%0" : "=m" (q[d]));
  68. asm volatile("pxor %mm4,%mm4");
  69. }
  70. raid6_after_mmx(&sa);
  71. }
  72. const struct raid6_calls raid6_mmxx1 = {
  73. raid6_mmx1_gen_syndrome,
  74. raid6_have_mmx,
  75. "mmxx1",
  76. 0
  77. };
  78. /*
  79. * Unrolled-by-2 MMX implementation
  80. */
  81. static void raid6_mmx2_gen_syndrome(int disks, size_t bytes, void **ptrs)
  82. {
  83. u8 **dptr = (u8 **)ptrs;
  84. u8 *p, *q;
  85. int d, z, z0;
  86. raid6_mmx_save_t sa;
  87. z0 = disks - 3; /* Highest data disk */
  88. p = dptr[z0+1]; /* XOR parity */
  89. q = dptr[z0+2]; /* RS syndrome */
  90. raid6_before_mmx(&sa);
  91. asm volatile("movq %0,%%mm0" : : "m" (raid6_mmx_constants.x1d));
  92. asm volatile("pxor %mm5,%mm5"); /* Zero temp */
  93. asm volatile("pxor %mm7,%mm7"); /* Zero temp */
  94. for ( d = 0 ; d < bytes ; d += 16 ) {
  95. asm volatile("movq %0,%%mm2" : : "m" (dptr[z0][d])); /* P[0] */
  96. asm volatile("movq %0,%%mm3" : : "m" (dptr[z0][d+8]));
  97. asm volatile("movq %mm2,%mm4"); /* Q[0] */
  98. asm volatile("movq %mm3,%mm6"); /* Q[1] */
  99. for ( z = z0-1 ; z >= 0 ; z-- ) {
  100. asm volatile("pcmpgtb %mm4,%mm5");
  101. asm volatile("pcmpgtb %mm6,%mm7");
  102. asm volatile("paddb %mm4,%mm4");
  103. asm volatile("paddb %mm6,%mm6");
  104. asm volatile("pand %mm0,%mm5");
  105. asm volatile("pand %mm0,%mm7");
  106. asm volatile("pxor %mm5,%mm4");
  107. asm volatile("pxor %mm7,%mm6");
  108. asm volatile("movq %0,%%mm5" : : "m" (dptr[z][d]));
  109. asm volatile("movq %0,%%mm7" : : "m" (dptr[z][d+8]));
  110. asm volatile("pxor %mm5,%mm2");
  111. asm volatile("pxor %mm7,%mm3");
  112. asm volatile("pxor %mm5,%mm4");
  113. asm volatile("pxor %mm7,%mm6");
  114. asm volatile("pxor %mm5,%mm5");
  115. asm volatile("pxor %mm7,%mm7");
  116. }
  117. asm volatile("movq %%mm2,%0" : "=m" (p[d]));
  118. asm volatile("movq %%mm3,%0" : "=m" (p[d+8]));
  119. asm volatile("movq %%mm4,%0" : "=m" (q[d]));
  120. asm volatile("movq %%mm6,%0" : "=m" (q[d+8]));
  121. }
  122. raid6_after_mmx(&sa);
  123. }
  124. const struct raid6_calls raid6_mmxx2 = {
  125. raid6_mmx2_gen_syndrome,
  126. raid6_have_mmx,
  127. "mmxx2",
  128. 0
  129. };
  130. #endif