dp_sub.c 4.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191
/* IEEE754 floating point arithmetic
 * double precision: subtraction
 */
  4. /*
  5. * MIPS floating point support
  6. * Copyright (C) 1994-2000 Algorithmics Ltd.
  7. * http://www.algor.co.uk
  8. *
  9. * ########################################################################
  10. *
  11. * This program is free software; you can distribute it and/or modify it
  12. * under the terms of the GNU General Public License (Version 2) as
  13. * published by the Free Software Foundation.
  14. *
  15. * This program is distributed in the hope it will be useful, but WITHOUT
  16. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  17. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
  18. * for more details.
  19. *
  20. * You should have received a copy of the GNU General Public License along
  21. * with this program; if not, write to the Free Software Foundation, Inc.,
  22. * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA.
  23. *
  24. * ########################################################################
  25. */
  26. #include "ieee754dp.h"
  27. ieee754dp ieee754dp_sub(ieee754dp x, ieee754dp y)
  28. {
  29. COMPXDP;
  30. COMPYDP;
  31. EXPLODEXDP;
  32. EXPLODEYDP;
  33. CLEARCX;
  34. FLUSHXDP;
  35. FLUSHYDP;
  36. switch (CLPAIR(xc, yc)) {
  37. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
  38. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
  39. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
  40. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
  41. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
  42. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
  43. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
  44. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
  45. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
  46. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
  47. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
  48. SETCX(IEEE754_INVALID_OPERATION);
  49. return ieee754dp_nanxcpt(ieee754dp_indef(), "sub", x, y);
  50. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
  51. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
  52. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
  53. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
  54. return y;
  55. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
  56. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
  57. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
  58. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
  59. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
  60. return x;
  61. /* Infinity handling
  62. */
  63. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
  64. if (xs != ys)
  65. return x;
  66. SETCX(IEEE754_INVALID_OPERATION);
  67. return ieee754dp_xcpt(ieee754dp_indef(), "sub", x, y);
  68. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
  69. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
  70. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
  71. return ieee754dp_inf(ys ^ 1);
  72. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
  73. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
  74. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
  75. return x;
  76. /* Zero handling
  77. */
  78. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
  79. if (xs != ys)
  80. return x;
  81. else
  82. return ieee754dp_zero(ieee754_csr.rm ==
  83. IEEE754_RD);
  84. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
  85. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
  86. return x;
  87. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
  88. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
  89. /* quick fix up */
  90. DPSIGN(y) ^= 1;
  91. return y;
  92. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
  93. DPDNORMX;
  94. /* FAAL THOROUGH */
  95. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
  96. /* normalize ym,ye */
  97. DPDNORMY;
  98. break;
  99. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
  100. /* normalize xm,xe */
  101. DPDNORMX;
  102. break;
  103. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
  104. break;
  105. }
  106. /* flip sign of y and handle as add */
  107. ys ^= 1;
  108. assert(xm & DP_HIDDEN_BIT);
  109. assert(ym & DP_HIDDEN_BIT);
  110. /* provide guard,round and stick bit dpace */
  111. xm <<= 3;
  112. ym <<= 3;
  113. if (xe > ye) {
  114. /* have to shift y fraction right to align
  115. */
  116. int s = xe - ye;
  117. ym = XDPSRS(ym, s);
  118. ye += s;
  119. } else if (ye > xe) {
  120. /* have to shift x fraction right to align
  121. */
  122. int s = ye - xe;
  123. xm = XDPSRS(xm, s);
  124. xe += s;
  125. }
  126. assert(xe == ye);
  127. assert(xe <= DP_EMAX);
  128. if (xs == ys) {
  129. /* generate 28 bit result of adding two 27 bit numbers
  130. */
  131. xm = xm + ym;
  132. xe = xe;
  133. xs = xs;
  134. if (xm >> (DP_MBITS + 1 + 3)) { /* carry out */
  135. xm = XDPSRS1(xm); /* shift preserving sticky */
  136. xe++;
  137. }
  138. } else {
  139. if (xm >= ym) {
  140. xm = xm - ym;
  141. xe = xe;
  142. xs = xs;
  143. } else {
  144. xm = ym - xm;
  145. xe = xe;
  146. xs = ys;
  147. }
  148. if (xm == 0) {
  149. if (ieee754_csr.rm == IEEE754_RD)
  150. return ieee754dp_zero(1); /* round negative inf. => sign = -1 */
  151. else
  152. return ieee754dp_zero(0); /* other round modes => sign = 1 */
  153. }
  154. /* normalize to rounding precision
  155. */
  156. while ((xm >> (DP_MBITS + 3)) == 0) {
  157. xm <<= 1;
  158. xe--;
  159. }
  160. }
  161. DPNORMRET2(xs, xe, xm, "sub", x, y);
  162. }