// moddi3.S
  1. //===----------------------Hexagon builtin routine ------------------------===//
  2. //
  3. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
  4. // See https://llvm.org/LICENSE.txt for license information.
  5. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  6. //
  7. //===----------------------------------------------------------------------===//
  // FUNCTION_BEGIN name: open the definition of a global function symbol.
  // Switches to the .text section, aligns the location counter, declares the
  // symbol global with type @function, and emits the symbol's label.
  8. .macro FUNCTION_BEGIN name
  9. .text
  10. .p2align 5 // power-of-two alignment: 2^5 = 32 bytes
  11. .globl \name
  12. .type \name, @function
  13. \name:
  14. .endm
  // FUNCTION_END name: record the size of the symbol as the distance from its
  // label to the current location. Intended to follow the last instruction of
  // the function.
  15. .macro FUNCTION_END name
  16. .size \name, . - \name
  17. .endm
  // __hexagon_moddi3: 64-bit signed remainder, computed with a shift-and-subtract
  // (restoring) division on the absolute values of both operands.
  //
  // In:     r1:0 = dividend, r3:2 = divisor (roles as labelled in the comments below).
  // Out:    r1:0 = remainder, negated when the dividend was negative; the sign of
  //         the divisor does not affect the result.
  // Writes: r0-r15, p0, p3 and the loop0 hardware-loop setup. No memory is accessed.
  // NOTE(review): no explicit zero-divisor check is visible in this routine.
  18. FUNCTION_BEGIN __hexagon_moddi3
  19. {
  20. p3 = tstbit(r1,#31) // p3 = top bit of the dividend's high word (its sign); selects the result sign at the end
  21. }
  22. {
  23. r1:0 = abs(r1:0) // work on magnitudes from here on
  24. r3:2 = abs(r3:2)
  25. }
  26. { // packet reads use the register values from before the packet, so r7 and r5:4 still see the divisor
  27. r6 = cl0(r1:0) // count leading 0's of dividend (numerator)
  28. r7 = cl0(r3:2) // count leading 0's of divisor (denominator)
  29. r5:4 = r3:2 // divisor moved into working registers
  30. r3:2 = r1:0 // dividend is the initial remainder, r3:2 contains remainder
  31. }
  32. {
  33. r10 = sub(r7,r6) // left shift count for bit & divisor
  34. r1:0 = #0 // initialize quotient to 0
  35. r15:14 = #1 // initialize bit to 1
  36. }
  37. {
  38. r11 = add(r10,#1) // loop count is 1 more than shift count
  39. r13:12 = lsl(r5:4,r10) // shift divisor msb into same bit position as dividend msb
  40. r15:14 = lsl(r15:14,r10) // shift the bit left by same amount as divisor
  41. }
  42. {
  43. p0 = cmp.gtu(r5:4,r3:2) // check if divisor > dividend (unsigned compare of the magnitudes)
  44. loop0(1f,r11) // register loop: body starts at label 1, runs r11 times
  45. }
  46. {
  47. if (p0) jump .hexagon_moddi3_return // if divisor > dividend, r3:2 (the dividend) is already the remainder, so skip the loop
  48. }
  49. .falign
  50. 1:
  // Loop body, one quotient bit per iteration: try to subtract the shifted
  // divisor from the remainder and keep the result only if it fits.
  51. {
  52. p0 = cmp.gtu(r13:12,r3:2) // set predicate reg if shifted divisor > current remainder
  53. }
  54. {
  55. r7:6 = sub(r3:2, r13:12) // candidate remainder: current remainder minus shifted divisor
  56. r9:8 = add(r1:0, r15:14) // candidate quotient: current quotient with this iteration's bit added
  57. }
  58. {
  59. r1:0 = vmux(p0, r1:0, r9:8) // p0 set: keep current quotient; p0 clear: take new quotient (r9:8)
  60. r3:2 = vmux(p0, r3:2, r7:6) // p0 set: keep current remainder; p0 clear: take new remainder (r7:6)
  61. }
  62. {
  63. r15:14 = lsr(r15:14, #1) // shift bit right by 1 for next iteration
  64. r13:12 = lsr(r13:12, #1) // shift "shifted divisor" right by 1 for next iteration
  65. }:endloop0 // last packet of the loop0 body
  // Common exit: r3:2 holds the unsigned remainder; apply the dividend's sign.
  66. .hexagon_moddi3_return:
  67. {
  68. r1:0 = neg(r3:2) // negated remainder, used only when the dividend was negative
  69. }
  70. {
  71. r1:0 = vmux(p3,r1:0,r3:2) // p3 set: return -remainder; p3 clear: return remainder
  72. jumpr r31 // return to caller; r31 presumably holds the return address
  73. }
  74. FUNCTION_END __hexagon_moddi3
  // Export __qdsp_moddi3 as a second global symbol with the same value as
  // __hexagon_moddi3, so either name refers to the same routine.
  75. .globl __qdsp_moddi3
  76. .set __qdsp_moddi3, __hexagon_moddi3