1 /* SPDX-License-Identifier: GPL-2.0 */
3 * linux/arch/arm/lib/div64.S
5 * Optimized computation of 64-bit dividend / 32-bit divisor
7 * Author: Nicolas Pitre
9 * Copyright: Monta Vista Software, Inc.
12 #include <linux/linkage.h>
13 #include <asm/assembler.h>
31 * __do_div64: perform a division with 64-bit dividend and 32-bit divisor.
33 * Note: Calling convention is totally non standard for optimal code.
34 * This is meant to be used by do_div() from include/asm/div64.h only.
37 * xh-xl = dividend (clobbered)
38 * r4 = divisor (preserved)
44 * Clobbered regs: xl, ip
47 .pushsection .text.__do_div64, "ax"
51 @ Test for easy paths first.
53 bls 9f @ divisor is 0 or 1
55 beq 8f @ divisor is power of 2
57 @ See if we need to handle upper 32-bit result.
62 @ Align divisor with upper part of dividend.
63 @ The aligned divisor is stored in yl preserving the original.
64 @ The bit position is stored in ip.
66 #if __LINUX_ARM_ARCH__ >= 5
79 1: cmp yl, #0x80000000
87 @ The division loop for needed upper bit positions.
88 @ Break out early if dividend reaches 0.
96 @ See if we need to handle lower 32-bit result.
103 @ The division loop for lower bit positions.
104 @ Here we shift remainder bits leftwards rather than moving the
105 @ divisor for comparisons, considering the carry-out bit as well.
107 4: movs xl, xl, lsl #1
117 @ The top part of remainder became zero. If carry is set
118 @ (the 33rd bit) this is a false positive so resume the loop.
119 @ Otherwise, if lower part is also null then we are done.
124 @ We still have remainder bits in the low part. Bring them up.
126 #if __LINUX_ARM_ARCH__ >= 5
128 clz xh, xl @ we know xh is zero here so...
135 7: movs xl, xl, lsl #1
141 @ Current remainder is now 1. It is pointless to compare with the
142 @ divisor at this point since the divisor cannot be smaller than 3 here.
143 @ If possible, branch for another shift in the division loop.
144 @ If no bit position left then we are done.
150 8: @ Division by a power of 2: determine what that divisor order is
151 @ then simply shift values around
153 #if __LINUX_ARM_ARCH__ >= 5
163 movhs yl, yl, lsr #16
176 addls ip, ip, yl, lsr #1
183 ARM( orr yl, yl, xh, lsl ip )
184 THUMB( lsl xh, xh, ip )
185 THUMB( orr yl, yl, xh )
190 @ eq -> division by 1: obvious enough...
205 @ as wrong as it could be...