divu.S 3.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899
  1. ;; Copyright 2010 Free Software Foundation, Inc.
  2. ;; Contributed by Bernd Schmidt <bernds@codesourcery.com>.
  3. ;;
  4. ;; This program is free software; you can redistribute it and/or modify
  5. ;; it under the terms of the GNU General Public License as published by
  6. ;; the Free Software Foundation; either version 2 of the License, or
  7. ;; (at your option) any later version.
  8. ;;
  9. ;; This program is distributed in the hope that it will be useful,
  10. ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. ;; GNU General Public License for more details.
  13. ;;
  14. ;; You should have received a copy of the GNU General Public License
  15. ;; along with this program; if not, write to the Free Software
  16. ;; Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
  17. #include <linux/linkage.h>
  18. ;; ABI considerations for the divide functions
  19. ;; The following registers are call-used:
  20. ;; __c6xabi_divi A0,A1,A2,A4,A6,B0,B1,B2,B4,B5
  21. ;; __c6xabi_divu A0,A1,A2,A4,A6,B0,B1,B2,B4
  22. ;; __c6xabi_remi A1,A2,A4,A5,A6,B0,B1,B2,B4
  23. ;; __c6xabi_remu A1,A4,A5,A7,B0,B1,B2,B4
  24. ;;
  25. ;; In our implementation, divu and remu are leaf functions,
  26. ;; while both divi and remi call into divu.
  27. ;; A0 is not clobbered by any of the functions.
  28. ;; divu does not clobber B2 either, which is taken advantage of
  29. ;; in remi.
  30. ;; divi uses B5 to hold the original return address during
  31. ;; the call to divu.
  32. ;; remi uses B2 and A5 to hold the input values during the
  33. ;; call to divu. It stores B3 in on the stack.
  34. .text
  35. ENTRY(__c6xabi_divu)
  36. ;; We use a series of up to 31 subc instructions. First, we find
  37. ;; out how many leading zero bits there are in the divisor. This
  38. ;; gives us both a shift count for aligning (shifting) the divisor
  39. ;; to the, and the number of times we have to execute subc.
  40. ;; At the end, we have both the remainder and most of the quotient
  41. ;; in A4. The top bit of the quotient is computed first and is
  42. ;; placed in A2.
  43. ;; Return immediately if the dividend is zero.
  44. mv .s2x A4, B1
  45. [B1] lmbd .l2 1, B4, B1
  46. || [!B1] b .s2 B3 ; RETURN A
  47. || [!B1] mvk .d2 1, B4
  48. mv .l1x B1, A6
  49. || shl .s2 B4, B1, B4
  50. ;; The loop performs a maximum of 28 steps, so we do the
  51. ;; first 3 here.
  52. cmpltu .l1x A4, B4, A2
  53. [!A2] sub .l1x A4, B4, A4
  54. || shru .s2 B4, 1, B4
  55. || xor .s1 1, A2, A2
  56. shl .s1 A2, 31, A2
  57. || [B1] subc .l1x A4,B4,A4
  58. || [B1] add .s2 -1, B1, B1
  59. [B1] subc .l1x A4,B4,A4
  60. || [B1] add .s2 -1, B1, B1
  61. ;; RETURN A may happen here (note: must happen before the next branch)
  62. _divu_loop:
  63. cmpgt .l2 B1, 7, B0
  64. || [B1] subc .l1x A4,B4,A4
  65. || [B1] add .s2 -1, B1, B1
  66. [B1] subc .l1x A4,B4,A4
  67. || [B1] add .s2 -1, B1, B1
  68. || [B0] b .s1 _divu_loop
  69. [B1] subc .l1x A4,B4,A4
  70. || [B1] add .s2 -1, B1, B1
  71. [B1] subc .l1x A4,B4,A4
  72. || [B1] add .s2 -1, B1, B1
  73. [B1] subc .l1x A4,B4,A4
  74. || [B1] add .s2 -1, B1, B1
  75. [B1] subc .l1x A4,B4,A4
  76. || [B1] add .s2 -1, B1, B1
  77. [B1] subc .l1x A4,B4,A4
  78. || [B1] add .s2 -1, B1, B1
  79. ;; loop backwards branch happens here
  80. ret .s2 B3
  81. || mvk .s1 32, A1
  82. sub .l1 A1, A6, A6
  83. shl .s1 A4, A6, A4
  84. shru .s1 A4, 1, A4
  85. || sub .l1 A6, 1, A6
  86. or .l1 A2, A4, A4
  87. shru .s1 A4, A6, A4
  88. nop
  89. ENDPROC(__c6xabi_divu)