fastmath2_ldlib_asm.S 8.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344
  1. //===----------------------Hexagon builtin routine ------------------------===//
  2. //
  3. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
  4. // See https://llvm.org/LICENSE.txt for license information.
  5. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  6. //
  7. //===----------------------------------------------------------------------===//
  8. /* ==================================================================== *
  9. fast2_QLDOUBLE fast2_ldadd(fast2_QLDOUBLE a,fast2_QLDOUBLE b) {
  10. fast2_QLDOUBLE c;
  11. lint manta = a & MANTMASK;
  12. int expa = Q6_R_sxth_R(a) ;
  13. lint mantb = b & MANTMASK;
  14. int expb = Q6_R_sxth_R(b) ;
  15. int exp, expdiff, j, k, hi, lo, cn;
  16. lint mant;
  17. expdiff = (int) Q6_P_vabsdiffh_PP(a, b);
  18. expdiff = Q6_R_sxth_R(expdiff) ;
  19. if (expdiff > 63) { expdiff = 62;}
  20. if (expa > expb) {
  21. exp = expa + 1;
  22. expa = 1;
  23. expb = expdiff + 1;
  24. } else {
  25. exp = expb + 1;
  26. expb = 1;
  27. expa = expdiff + 1;
  28. }
  29. mant = (manta>>expa) + (mantb>>expb);
  30. hi = (int) (mant>>32);
  31. lo = (int) (mant);
  32. k = Q6_R_normamt_R(hi);
  33. if(hi == 0 || hi == -1) k = 31+Q6_R_normamt_R(lo);
  34. mant = (mant << k);
  35. cn = (mant == 0x8000000000000000LL);
  36. exp = exp - k + cn;
  37. if (mant == 0 || mant == -1) exp = 0x8001;
  38. c = (mant & MANTMASK) | (((lint) exp) & EXP_MASK);
  39. return(c);
  40. }
  41. * ==================================================================== */
  .text
  .global fast2_ldadd_asm
  .type fast2_ldadd_asm, @function
// fast2_ldadd_asm: add two values that are each held as a 64-bit mantissa
// plus a separate 32-bit exponent word.
//
// Inputs, as read by the code below:
//   r0        base address for the result (copied to r7 before r1:0 is reused)
//   r29+#0    mantissa of a (64 bits)      r29+#8    exponent of a (32 bits)
//   r29+#16   mantissa of b (64 bits)      r29+#24   exponent of b (32 bits)
// Outputs:
//   [r7+#0]   result mantissa (64 bits)    [r7+#8]   result exponent (32 bits)
// Registers written: r0-r9 and p0. No stack space is allocated.
// NOTE(review): presumably r0 is the hidden struct-return pointer and both
// operands are 16-byte structs passed on the stack; confirm against the C
// prototype, which is not visible in this file.
//
// Steps:
//   1. d = min(|expa - expb|, 62), using saturating sub and abs. The C sketch
//      in the comment block above this routine tests "> 63" instead.
//   2. The operand with the larger exponent is shifted right by 1 and the
//      other by d + 1 (on a tie, b is shifted by 1 and a by d + 1).
//   3. sum = a + b, k = clb(sum) - 1, mantissa = sum << k,
//      exponent = max(expa, expb) + 1 - k.
//   4. If clb(sum) > 58 the result is stored as mantissa 0 with the
//      exponent word 0x80000001.
//
// Hexagon packet rule relied on below: every instruction inside one { }
// packet reads register values from before the packet (only .new predicates
// see a value produced in the same packet).
fast2_ldadd_asm:
// Register aliases. manta, lmanta and lmant all name r1:0; mantb, lmantb and
// zero all name r3:2; expa and k both name r4.
#define manta R1:0
#define lmanta R1:0
#define mantb R3:2
#define lmantb R3:2
#define expa R4
#define expb R5
#define expd R6
#define exp R8
#define c63 R9
#define lmant R1:0
#define k R4
#define ce P0
#define zero R3:2
  .falign
  {
    expa = memw(r29+#8)               // exponent of a
    expb = memw(r29+#24)              // exponent of b
    r7 = r0                           // keep result base; r1:0 becomes manta
  }
  {
    expd = sub(expa, expb):sat        // signed exponent difference
    ce = cmp.gt(expa, expb)           // ce set: a has the larger exponent
    if ( ce.new) exp = add(expa, #1)  // exp = max(expa, expb) + 1
    if (!ce.new) exp = add(expb, #1)
  }
  {
    expd = abs(expd):sat              // |expa - expb|
    if ( ce) expa = #1                // larger-exponent operand shifts by 1
    if (!ce) expb = #1
    c63 = #62                         // clamp limit for the difference
  }
  {
    expd = min(expd, c63)             // d = min(|expa - expb|, 62)
    manta = memd(r29+#0)
    mantb = memd(r29+#16)
  }
  {
    if (!ce) expa = add(expd, #1)     // smaller-exponent operand shifts by d + 1
    if ( ce) expb = add(expd, #1)
  }
  {
    lmanta = asr(lmanta, expa)        // align both mantissas
    lmantb = asr(lmantb, expb)
  }
  {
    lmant = add(lmanta, lmantb)
    zero = #0                         // r3:2 is free now; stored on .Ldenorma
  }
  {
    k = clb(lmant)                    // count of leading identical bits
    c63.L = #0x0001                   // start building 0x80000001 in r9
  }
  {
    exp -= add(k, #-1)                // exp = exp - (k - 1)
    k = add(k, #-1)                   // normalizing left shift = clb - 1
    p0 = cmp.gt(k, #58)               // reads pre-decrement k: clb > 58
    c63.H = #0x8000                   // r9 = 0x80000001
  }
  {
    if (!p0) memw(r7+#8) = exp        // exponent is stored only on the normal path
    lmant = asl(lmant, k)
    if (p0) jump .Ldenorma
  }
  {
    memd(r7+#0) = lmant
    jumpr r31
  }
// Sum had more than 58 leading identical bits: store zero mantissa and the
// marker exponent word 0x80000001.
.Ldenorma:
  memd(r7+#0) = zero
  {
    memw(r7+#8) = c63
    jumpr r31
  }
  .size fast2_ldadd_asm, .-fast2_ldadd_asm
  110. /* =================================================================== *
  111. fast2_QLDOUBLE fast2_ldsub(fast2_QLDOUBLE a,fast2_QLDOUBLE b) {
  112. fast2_QLDOUBLE c;
  113. lint manta = a & MANTMASK;
  114. int expa = Q6_R_sxth_R(a) ;
  115. lint mantb = b & MANTMASK;
  116. int expb = Q6_R_sxth_R(b) ;
  117. int exp, expdiff, j, k;
  118. lint mant;
  119. expdiff = (int) Q6_P_vabsdiffh_PP(a, b);
  120. expdiff = Q6_R_sxth_R(expdiff) ;
  121. if (expdiff > 63) { expdiff = 62;}
  122. if (expa > expb) {
  123. exp = expa + 1;
  124. expa = 1;
  125. expb = expdiff + 1;
  126. } else {
  127. exp = expb + 1;
  128. expb = 1;
  129. expa = expdiff + 1;
  130. }
  131. mant = (manta>>expa) - (mantb>>expb);
  132. k = Q6_R_clb_P(mant)-1;
  133. mant = (mant << k);
  134. exp = exp - k;
  135. if (mant == 0 || mant == -1) exp = 0x8001;
  136. c = (mant & MANTMASK) | (((lint) exp) & EXP_MASK);
  137. return(c);
  138. }
  139. * ==================================================================== */
  .text
  .global fast2_ldsub_asm
  .type fast2_ldsub_asm, @function
// fast2_ldsub_asm: subtract b from a, where each value is held as a 64-bit
// mantissa plus a separate 32-bit exponent word.
//
// Inputs, as read by the code below:
//   r0        base address for the result (copied to r7 before r1:0 is reused)
//   r29+#0    mantissa of a (64 bits)      r29+#8    exponent of a (32 bits)
//   r29+#16   mantissa of b (64 bits)      r29+#24   exponent of b (32 bits)
// Outputs:
//   [r7+#0]   result mantissa (64 bits)    [r7+#8]   result exponent (32 bits)
// Registers written: r0-r9 and p0. No stack space is allocated.
// NOTE(review): presumably r0 is the hidden struct-return pointer and both
// operands are 16-byte structs passed on the stack; confirm against the C
// prototype, which is not visible in this file.
//
// Steps:
//   1. d = min(|expa - expb|, 62), using saturating sub and abs. The C sketch
//      in the comment block above this routine tests "> 63" instead.
//   2. The operand with the larger exponent is shifted right by 1 and the
//      other by d + 1 (on a tie, b is shifted by 1 and a by d + 1).
//   3. diff = a - b, k = clb(diff) - 1, mantissa = diff << k,
//      exponent = max(expa, expb) + 1 - k.
//   4. If clb(diff) > 58 the result is stored as mantissa 0 with the
//      exponent word 0x80000001.
//
// Hexagon packet rule relied on below: every instruction inside one { }
// packet reads register values from before the packet (only .new predicates
// see a value produced in the same packet).
fast2_ldsub_asm:
// Register aliases. manta, lmanta and lmant all name r1:0; mantb, lmantb and
// zero all name r3:2; expa and k both name r4.
#define manta R1:0
#define lmanta R1:0
#define mantb R3:2
#define lmantb R3:2
#define expa R4
#define expb R5
#define expd R6
#define exp R8
#define c63 R9
#define lmant R1:0
#define k R4
#define ce P0
#define zero R3:2
  .falign
  {
    expa = memw(r29+#8)               // exponent of a
    expb = memw(r29+#24)              // exponent of b
    r7 = r0                           // keep result base; r1:0 becomes manta
  }
  {
    expd = sub(expa, expb):sat        // signed exponent difference
    ce = cmp.gt(expa, expb)           // ce set: a has the larger exponent
    if ( ce.new) exp = add(expa, #1)  // exp = max(expa, expb) + 1
    if (!ce.new) exp = add(expb, #1)
  }
  {
    expd = abs(expd):sat              // |expa - expb|
    if ( ce) expa = #1                // larger-exponent operand shifts by 1
    if (!ce) expb = #1
    c63 = #62                         // clamp limit for the difference
  }
  {
    expd = min(expd, c63)             // d = min(|expa - expb|, 62)
    manta = memd(r29+#0)
    mantb = memd(r29+#16)
  }
  {
    if (!ce) expa = add(expd, #1)     // smaller-exponent operand shifts by d + 1
    if ( ce) expb = add(expd, #1)
  }
  {
    lmanta = asr(lmanta, expa)        // align both mantissas
    lmantb = asr(lmantb, expb)
  }
  {
    lmant = sub(lmanta, lmantb)       // aligned a minus aligned b
    zero = #0                         // r3:2 is free now; stored on .Ldenorma_s
  }
  {
    k = clb(lmant)                    // count of leading identical bits
    c63.L = #0x0001                   // start building 0x80000001 in r9
  }
  {
    exp -= add(k, #-1)                // exp = exp - (k - 1)
    k = add(k, #-1)                   // normalizing left shift = clb - 1
    p0 = cmp.gt(k, #58)               // reads pre-decrement k: clb > 58
    c63.H = #0x8000                   // r9 = 0x80000001
  }
  {
    if (!p0) memw(r7+#8) = exp        // exponent is stored only on the normal path
    lmant = asl(lmant, k)
    if (p0) jump .Ldenorma_s
  }
  {
    memd(r7+#0) = lmant
    jumpr r31
  }
// Difference had more than 58 leading identical bits: store zero mantissa
// and the marker exponent word 0x80000001.
.Ldenorma_s:
  memd(r7+#0) = zero
  {
    memw(r7+#8) = c63
    jumpr r31
  }
  .size fast2_ldsub_asm, .-fast2_ldsub_asm
  208. /* ==================================================================== *
  209. fast2_QLDOUBLE fast2_ldmpy(fast2_QLDOUBLE a,fast2_QLDOUBLE b) {
  210. fast2_QLDOUBLE c;
  211. lint manta = a & MANTMASK;
  212. int expa = Q6_R_sxth_R(a) ;
  213. lint mantb = b & MANTMASK;
  214. int expb = Q6_R_sxth_R(b) ;
  215. int exp, k;
  216. lint mant;
  217. int hia, hib, hi, lo;
  218. unsigned int loa, lob;
  219. hia = (int)(a >> 32);
  220. loa = Q6_R_extractu_RII((int)manta, 31, 1);
  221. hib = (int)(b >> 32);
  222. lob = Q6_R_extractu_RII((int)mantb, 31, 1);
  223. mant = Q6_P_mpy_RR(hia, lob);
  224. mant = Q6_P_mpyacc_RR(mant,hib, loa);
  225. mant = (mant >> 30) + (Q6_P_mpy_RR(hia, hib)<<1);
  226. hi = (int) (mant>>32);
  227. k = Q6_R_normamt_R(hi);
  228. mant = mant << k;
  229. exp = expa + expb - k;
  230. if (mant == 0 || mant == -1) exp = 0x8001;
  231. c = (mant & MANTMASK) | (((lint) exp) & EXP_MASK);
  232. return(c);
  233. }
  234. * ==================================================================== */
  .text
  .global fast2_ldmpy_asm
  .type fast2_ldmpy_asm, @function
// fast2_ldmpy_asm: multiply two values that are each held as a 64-bit
// mantissa plus a separate 32-bit exponent word.
//
// Inputs, as read by the code below:
//   r0        base address for the result (never overwritten here)
//   r29+#0    mantissa of x (64 bits)      r29+#8    exponent of x (32 bits)
//   r29+#16   mantissa of b (64 bits)      r29+#24   exponent of b (32 bits)
// Outputs:
//   [r0+#0]   result mantissa (64 bits)    [r0+#8]   result exponent (32 bits)
// Registers written: r2-r15 and p0-p2. No stack space is allocated.
// NOTE(review): presumably r0 is the hidden struct-return pointer and both
// operands are 16-byte structs passed on the stack; confirm against the C
// prototype, which is not visible in this file.
//
// Steps:
//   1. mantxl_ and mantbl_ are bits 31..1 of each low mantissa word.
//   2. cross = mantxh * mantbl_ + mantbh * mantxl_
//      high  = 2 * (mantxh * mantbh)
//      prod  = (cross >> 30) + high
//   3. kp = clb(prod) - 1, mantissa = prod << kp,
//      exponent = expa + expb - kp.
//   4. If kp > 58 the result is stored as mantissa 0 with the exponent
//      word 0x80000001 (.Ldenorm).
//   5. If both input mantissas equal 0x8000000000000000 the doubled high
//      product wraps, so the result is stored as mantissa
//      0x4000000000000000 with exponent expa + expb + 1 (.Lsat).
//
// Hexagon packet rule relied on below: every instruction inside one { }
// packet reads register values from before the packet (only .new predicates
// see a value produced in the same packet).
fast2_ldmpy_asm:
// Register aliases. mantbl_ and c8001 share r8; mantxl_ and kp share r9;
// mostneg and satmant share r13:12. Each pair is used at disjoint times.
// The r13:12 aliases are deliberately not called min and max: object-like
// macros with those names would replace the min() and max() instruction
// mnemonics in everything assembled after this point.
#define mantxl_ R9
#define mantxl R14
#define mantxh R15
#define mantx R15:14
#define mantbl R2
#define mantbl_ R8
#define mantbh R3
#define mantb R3:2
#define expa R4
#define expb R5
#define c8001 R8
#define mantd R7:6
#define lmantc R11:10
#define kp R9
#define mostneg R13:12
#define mostnegh R13
#define satmant R13:12
#define satmanth R13
#define ret R0
  .falign
  {
    mantx = memd(r29+#0)
    mantb = memd(r29+#16)
    mostneg = #0                        // low half of 0x8000000000000000
  }
  {
    mantbl_ = extractu(mantbl, #31, #1) // bits 31..1 of low word of b
    mantxl_ = extractu(mantxl, #31, #1) // bits 31..1 of low word of x
    mostnegh.H = #0x8000                // r13:12 = 0x8000000000000000
  }
  {
    lmantc = mpy(mantxh, mantbh)        // high * high
    mantd = mpy(mantxh, mantbl_)        // first cross product
    expa = memw(r29+#8)
    expb = memw(r29+#24)
  }
  {
    lmantc = add(lmantc, lmantc)        // (high * high) << 1
    mantd += mpy(mantbh, mantxl_)       // add second cross product
  }
  {
    mantd = asr(mantd, #30)             // scale the cross-product sum
    c8001.L = #0x0001                   // start building 0x80000001 in r8
    p1 = cmp.eq(mantx, mantb)           // both mantissas identical?
  }
  {
    mantd = add(mantd, lmantc)          // full product before normalization
    expa = add(expa, expb)              // exponent sum
    p2 = cmp.eq(mantb, mostneg)         // b == 0x8000000000000000?
  }
  {
    kp = clb(mantd)                     // count of leading identical bits
    c8001.H = #0x8000                   // r8 = 0x80000001
    p1 = and(p1, p2)                    // x == b == 0x8000000000000000
  }
  {
    expa -= add(kp, #-1)                // expa = expa - (clb - 1)
    kp = add(kp, #-1)                   // normalizing left shift = clb - 1
    if (p1) jump .Lsat
  }
  {
    mantd = asl(mantd, kp)
    memw(ret+#8) = expa                 // overwritten again on the .Ldenorm path
    p0 = cmp.gt(kp, #58)                // kp is already decremented here
    if (p0.new) jump:NT .Ldenorm        // rarely happens
  }
  {
    memd(ret+#0) = mantd
    jumpr r31
  }
// Both mantissas were 0x8000000000000000: store 0x4000000000000000 with
// exponent expa + expb + 1.
.Lsat:
  {
    satmant = #0
    expa += add(kp, #1)                 // undo the -kp above and add 1
  }
  {
    satmanth.H = #0x4000                // r13:12 = 0x4000000000000000
    memw(ret+#8) = expa
  }
  {
    memd(ret+#0) = satmant
    jumpr r31
  }
// Product needed a shift of more than 58: store zero mantissa and the
// marker exponent word 0x80000001.
.Ldenorm:
  {
    memw(ret+#8) = c8001
    mantx = #0
  }
  {
    memd(ret+#0) = mantx
    jumpr r31
  }
  .size fast2_ldmpy_asm, .-fast2_ldmpy_asm