123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687 |
- #include <linux/linkage.h>
- /*
- * Unsigned modulo operation for 32 bit integers.
- * Input : op1 in Reg r5
- * op2 in Reg r6
- * Output: op1 mod op2 in Reg r3
- */
- .text
- .globl __umodsi3
- .type __umodsi3, @function
- .ent __umodsi3
- __umodsi3:
- .frame r1, 0, r15
- addik r1, r1, -12
- swi r29, r1, 0
- swi r30, r1, 4
- swi r31, r1, 8
- beqi r6, div_by_zero /* div_by_zero - division error */
- beqid r5, result_is_zero /* result is zero */
- addik r3, r0, 0 /* clear div */
- addik r30, r0, 0 /* clear mod */
- addik r29, r0, 32 /* initialize the loop count */
- /* check if r6 and r5 are equal /* if yes, return 0 */
- rsub r18, r5, r6
- beqi r18, return_here
- /* check if (uns)r6 is greater than (uns)r5. in that case, just return r5 */
- xor r18, r5, r6
- bgeid r18, 16
- addik r3, r5, 0
- blti r6, return_here
- bri $lcheckr6
- rsub r18, r5, r6 /* microblazecmp */
- bgti r18, return_here
- /* if r6 [bit 31] is set, then return result as r5-r6 */
- $lcheckr6:
- bgtid r6, div0
- addik r3, r0, 0
- addik r18, r0, 0x7fffffff
- and r5, r5, r18
- and r6, r6, r18
- brid return_here
- rsub r3, r6, r5
- /* first part: try to find the first '1' in the r5 */
- div0:
- blti r5, div2
- div1:
- add r5, r5, r5 /* left shift logical r5 */
- bgeid r5, div1
- addik r29, r29, -1
- div2:
- /* left shift logical r5 get the '1' into the carry */
- add r5, r5, r5
- addc r3, r3, r3 /* move that bit into the mod register */
- rsub r31, r6, r3 /* try to subtract (r3 a r6) */
- blti r31, mod_too_small
- /* move the r31 to mod since the result was positive */
- or r3, r0, r31
- addik r30, r30, 1
- mod_too_small:
- addik r29, r29, -1
- beqi r29, loop_end
- add r30, r30, r30 /* shift in the '1' into div */
- bri div2 /* div2 */
- loop_end:
- bri return_here
- div_by_zero:
- result_is_zero:
- or r3, r0, r0 /* set result to 0 */
- return_here:
- /* restore values of csrs and that of r3 and the divisor and the dividend */
- lwi r29, r1, 0
- lwi r30, r1, 4
- lwi r31, r1, 8
- rtsd r15, 8
- addik r1, r1, 12
- .size __umodsi3, . - __umodsi3
- .end __umodsi3
|