/* dp_mul.c */
/* IEEE754 floating point arithmetic
 * double precision: multiplication
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 *
 * ########################################################################
 *
 * This program is free software; you can distribute it and/or modify it
 * under the terms of the GNU General Public License (Version 2) as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA.
 *
 * ########################################################################
 */
  25. #include "ieee754dp.h"
  26. ieee754dp ieee754dp_mul(ieee754dp x, ieee754dp y)
  27. {
  28. COMPXDP;
  29. COMPYDP;
  30. EXPLODEXDP;
  31. EXPLODEYDP;
  32. CLEARCX;
  33. FLUSHXDP;
  34. FLUSHYDP;
  35. switch (CLPAIR(xc, yc)) {
  36. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
  37. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
  38. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
  39. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
  40. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
  41. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
  42. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
  43. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
  44. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
  45. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
  46. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
  47. SETCX(IEEE754_INVALID_OPERATION);
  48. return ieee754dp_nanxcpt(ieee754dp_indef(), "mul", x, y);
  49. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
  50. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
  51. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
  52. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
  53. return y;
  54. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
  55. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
  56. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
  57. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
  58. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
  59. return x;
  60. /* Infinity handling */
  61. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
  62. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
  63. SETCX(IEEE754_INVALID_OPERATION);
  64. return ieee754dp_xcpt(ieee754dp_indef(), "mul", x, y);
  65. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
  66. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
  67. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
  68. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
  69. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
  70. return ieee754dp_inf(xs ^ ys);
  71. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
  72. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
  73. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
  74. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
  75. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
  76. return ieee754dp_zero(xs ^ ys);
  77. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
  78. DPDNORMX;
  79. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
  80. DPDNORMY;
  81. break;
  82. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
  83. DPDNORMX;
  84. break;
  85. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
  86. break;
  87. }
  88. /* rm = xm * ym, re = xe+ye basically */
  89. assert(xm & DP_HIDDEN_BIT);
  90. assert(ym & DP_HIDDEN_BIT);
  91. {
  92. int re = xe + ye;
  93. int rs = xs ^ ys;
  94. u64 rm;
  95. /* shunt to top of word */
  96. xm <<= 64 - (DP_MBITS + 1);
  97. ym <<= 64 - (DP_MBITS + 1);
  98. /* multiply 32bits xm,ym to give high 32bits rm with stickness
  99. */
  100. /* 32 * 32 => 64 */
  101. #define DPXMULT(x, y) ((u64)(x) * (u64)y)
  102. {
  103. unsigned lxm = xm;
  104. unsigned hxm = xm >> 32;
  105. unsigned lym = ym;
  106. unsigned hym = ym >> 32;
  107. u64 lrm;
  108. u64 hrm;
  109. lrm = DPXMULT(lxm, lym);
  110. hrm = DPXMULT(hxm, hym);
  111. {
  112. u64 t = DPXMULT(lxm, hym);
  113. {
  114. u64 at =
  115. lrm + (t << 32);
  116. hrm += at < lrm;
  117. lrm = at;
  118. }
  119. hrm = hrm + (t >> 32);
  120. }
  121. {
  122. u64 t = DPXMULT(hxm, lym);
  123. {
  124. u64 at =
  125. lrm + (t << 32);
  126. hrm += at < lrm;
  127. lrm = at;
  128. }
  129. hrm = hrm + (t >> 32);
  130. }
  131. rm = hrm | (lrm != 0);
  132. }
  133. /*
  134. * sticky shift down to normal rounding precision
  135. */
  136. if ((s64) rm < 0) {
  137. rm =
  138. (rm >> (64 - (DP_MBITS + 1 + 3))) |
  139. ((rm << (DP_MBITS + 1 + 3)) != 0);
  140. re++;
  141. } else {
  142. rm =
  143. (rm >> (64 - (DP_MBITS + 1 + 3 + 1))) |
  144. ((rm << (DP_MBITS + 1 + 3 + 1)) != 0);
  145. }
  146. assert(rm & (DP_HIDDEN_BIT << 3));
  147. DPNORMRET2(rs, re, rm, "mul", x, y);
  148. }
  149. }