sp_mul.c 4.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171
  1. /* IEEE754 floating point arithmetic
  2. * single precision
  3. */
  4. /*
  5. * MIPS floating point support
  6. * Copyright (C) 1994-2000 Algorithmics Ltd.
  7. * http://www.algor.co.uk
  8. *
  9. * ########################################################################
  10. *
  11. * This program is free software; you can distribute it and/or modify it
  12. * under the terms of the GNU General Public License (Version 2) as
  13. * published by the Free Software Foundation.
  14. *
  15. * This program is distributed in the hope it will be useful, but WITHOUT
  16. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  17. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
  18. * for more details.
  19. *
  20. * You should have received a copy of the GNU General Public License along
  21. * with this program; if not, write to the Free Software Foundation, Inc.,
  22. * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA.
  23. *
  24. * ########################################################################
  25. */
  26. #include "ieee754sp.h"
  27. ieee754sp ieee754sp_mul(ieee754sp x, ieee754sp y)
  28. {
  29. COMPXSP;
  30. COMPYSP;
  31. EXPLODEXSP;
  32. EXPLODEYSP;
  33. CLEARCX;
  34. FLUSHXSP;
  35. FLUSHYSP;
  36. switch (CLPAIR(xc, yc)) {
  37. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
  38. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
  39. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
  40. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
  41. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
  42. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
  43. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
  44. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
  45. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
  46. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
  47. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
  48. SETCX(IEEE754_INVALID_OPERATION);
  49. return ieee754sp_nanxcpt(ieee754sp_indef(), "mul", x, y);
  50. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
  51. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
  52. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
  53. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
  54. return y;
  55. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
  56. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
  57. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
  58. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
  59. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
  60. return x;
  61. /* Infinity handling */
  62. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
  63. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
  64. SETCX(IEEE754_INVALID_OPERATION);
  65. return ieee754sp_xcpt(ieee754sp_indef(), "mul", x, y);
  66. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
  67. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
  68. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
  69. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
  70. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
  71. return ieee754sp_inf(xs ^ ys);
  72. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
  73. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
  74. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
  75. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
  76. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
  77. return ieee754sp_zero(xs ^ ys);
  78. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
  79. SPDNORMX;
  80. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
  81. SPDNORMY;
  82. break;
  83. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
  84. SPDNORMX;
  85. break;
  86. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
  87. break;
  88. }
  89. /* rm = xm * ym, re = xe+ye basicly */
  90. assert(xm & SP_HIDDEN_BIT);
  91. assert(ym & SP_HIDDEN_BIT);
  92. {
  93. int re = xe + ye;
  94. int rs = xs ^ ys;
  95. unsigned rm;
  96. /* shunt to top of word */
  97. xm <<= 32 - (SP_MBITS + 1);
  98. ym <<= 32 - (SP_MBITS + 1);
  99. /* multiply 32bits xm,ym to give high 32bits rm with stickness
  100. */
  101. {
  102. unsigned short lxm = xm & 0xffff;
  103. unsigned short hxm = xm >> 16;
  104. unsigned short lym = ym & 0xffff;
  105. unsigned short hym = ym >> 16;
  106. unsigned lrm;
  107. unsigned hrm;
  108. lrm = lxm * lym; /* 16 * 16 => 32 */
  109. hrm = hxm * hym; /* 16 * 16 => 32 */
  110. {
  111. unsigned t = lxm * hym; /* 16 * 16 => 32 */
  112. {
  113. unsigned at = lrm + (t << 16);
  114. hrm += at < lrm;
  115. lrm = at;
  116. }
  117. hrm = hrm + (t >> 16);
  118. }
  119. {
  120. unsigned t = hxm * lym; /* 16 * 16 => 32 */
  121. {
  122. unsigned at = lrm + (t << 16);
  123. hrm += at < lrm;
  124. lrm = at;
  125. }
  126. hrm = hrm + (t >> 16);
  127. }
  128. rm = hrm | (lrm != 0);
  129. }
  130. /*
  131. * sticky shift down to normal rounding precision
  132. */
  133. if ((int) rm < 0) {
  134. rm = (rm >> (32 - (SP_MBITS + 1 + 3))) |
  135. ((rm << (SP_MBITS + 1 + 3)) != 0);
  136. re++;
  137. } else {
  138. rm = (rm >> (32 - (SP_MBITS + 1 + 3 + 1))) |
  139. ((rm << (SP_MBITS + 1 + 3 + 1)) != 0);
  140. }
  141. assert(rm & (SP_HIDDEN_BIT << 3));
  142. SPNORMRET2(rs, re, rm, "mul", x, y);
  143. }
  144. }