sp_mul.c 3.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /* IEEE754 floating point arithmetic
  3. * single precision
  4. */
  5. /*
  6. * MIPS floating point support
  7. * Copyright (C) 1994-2000 Algorithmics Ltd.
  8. */
  9. #include "ieee754sp.h"
  10. union ieee754sp ieee754sp_mul(union ieee754sp x, union ieee754sp y)
  11. {
  12. int re;
  13. int rs;
  14. unsigned int rm;
  15. unsigned short lxm;
  16. unsigned short hxm;
  17. unsigned short lym;
  18. unsigned short hym;
  19. unsigned int lrm;
  20. unsigned int hrm;
  21. unsigned int t;
  22. unsigned int at;
  23. COMPXSP;
  24. COMPYSP;
  25. EXPLODEXSP;
  26. EXPLODEYSP;
  27. ieee754_clearcx();
  28. FLUSHXSP;
  29. FLUSHYSP;
  30. switch (CLPAIR(xc, yc)) {
  31. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
  32. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
  33. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
  34. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
  35. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
  36. return ieee754sp_nanxcpt(y);
  37. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
  38. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
  39. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
  40. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
  41. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
  42. case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
  43. return ieee754sp_nanxcpt(x);
  44. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
  45. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
  46. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
  47. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
  48. return y;
  49. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
  50. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
  51. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
  52. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
  53. case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
  54. return x;
  55. /*
  56. * Infinity handling
  57. */
  58. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
  59. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
  60. ieee754_setcx(IEEE754_INVALID_OPERATION);
  61. return ieee754sp_indef();
  62. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
  63. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
  64. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
  65. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
  66. case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
  67. return ieee754sp_inf(xs ^ ys);
  68. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
  69. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
  70. case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
  71. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
  72. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
  73. return ieee754sp_zero(xs ^ ys);
  74. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
  75. SPDNORMX;
  76. fallthrough;
  77. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
  78. SPDNORMY;
  79. break;
  80. case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
  81. SPDNORMX;
  82. break;
  83. case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
  84. break;
  85. }
  86. /* rm = xm * ym, re = xe+ye basically */
  87. assert(xm & SP_HIDDEN_BIT);
  88. assert(ym & SP_HIDDEN_BIT);
  89. re = xe + ye;
  90. rs = xs ^ ys;
  91. /* shunt to top of word */
  92. xm <<= 32 - (SP_FBITS + 1);
  93. ym <<= 32 - (SP_FBITS + 1);
  94. /*
  95. * Multiply 32 bits xm, ym to give high 32 bits rm with stickness.
  96. */
  97. lxm = xm & 0xffff;
  98. hxm = xm >> 16;
  99. lym = ym & 0xffff;
  100. hym = ym >> 16;
  101. lrm = lxm * lym; /* 16 * 16 => 32 */
  102. hrm = hxm * hym; /* 16 * 16 => 32 */
  103. t = lxm * hym; /* 16 * 16 => 32 */
  104. at = lrm + (t << 16);
  105. hrm += at < lrm;
  106. lrm = at;
  107. hrm = hrm + (t >> 16);
  108. t = hxm * lym; /* 16 * 16 => 32 */
  109. at = lrm + (t << 16);
  110. hrm += at < lrm;
  111. lrm = at;
  112. hrm = hrm + (t >> 16);
  113. rm = hrm | (lrm != 0);
  114. /*
  115. * Sticky shift down to normal rounding precision.
  116. */
  117. if ((int) rm < 0) {
  118. rm = (rm >> (32 - (SP_FBITS + 1 + 3))) |
  119. ((rm << (SP_FBITS + 1 + 3)) != 0);
  120. re++;
  121. } else {
  122. rm = (rm >> (32 - (SP_FBITS + 1 + 3 + 1))) |
  123. ((rm << (SP_FBITS + 1 + 3 + 1)) != 0);
  124. }
  125. assert(rm & (SP_HIDDEN_BIT << 3));
  126. return ieee754sp_format(rs, re, rm);
  127. }