/* ===-- udivmoddi4.c - Implement __udivmoddi4 -----------------------------===
 *
 *                     The LLVM Compiler Infrastructure
 *
 * This file is dual licensed under the MIT and the University of Illinois Open
 * Source Licenses. See LICENSE.TXT for details.
 *
 * ===----------------------------------------------------------------------===
 *
 * This file implements __udivmoddi4 for the compiler_rt library.
 *
 * ===----------------------------------------------------------------------===
 */

#include "int_lib.h"

Edward O'Callaghan37a6a452009-08-07 20:30:09 +000017/* Effects: if rem != 0, *rem = a % b
18 * Returns: a / b
19 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +000020
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000021/* Translated from Figure 3-40 of The PowerPC Compiler Writer's Guide */
Daniel Dunbarb3a69012009-06-26 16:47:03 +000022
Anton Korobeynikov1c5f89b2011-04-19 17:52:09 +000023COMPILER_RT_ABI du_int
Daniel Dunbarb3a69012009-06-26 16:47:03 +000024__udivmoddi4(du_int a, du_int b, du_int* rem)
25{
26 const unsigned n_uword_bits = sizeof(su_int) * CHAR_BIT;
27 const unsigned n_udword_bits = sizeof(du_int) * CHAR_BIT;
28 udwords n;
29 n.all = a;
30 udwords d;
31 d.all = b;
32 udwords q;
33 udwords r;
34 unsigned sr;
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000035 /* special cases, X is unknown, K != 0 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000036 if (n.s.high == 0)
Daniel Dunbarb3a69012009-06-26 16:47:03 +000037 {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000038 if (d.s.high == 0)
Daniel Dunbarb3a69012009-06-26 16:47:03 +000039 {
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000040 /* 0 X
41 * ---
42 * 0 X
43 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +000044 if (rem)
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000045 *rem = n.s.low % d.s.low;
46 return n.s.low / d.s.low;
Daniel Dunbarb3a69012009-06-26 16:47:03 +000047 }
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000048 /* 0 X
49 * ---
50 * K X
51 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +000052 if (rem)
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000053 *rem = n.s.low;
Daniel Dunbarb3a69012009-06-26 16:47:03 +000054 return 0;
55 }
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000056 /* n.s.high != 0 */
57 if (d.s.low == 0)
Daniel Dunbarb3a69012009-06-26 16:47:03 +000058 {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000059 if (d.s.high == 0)
Daniel Dunbarb3a69012009-06-26 16:47:03 +000060 {
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000061 /* K X
62 * ---
63 * 0 0
64 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +000065 if (rem)
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000066 *rem = n.s.high % d.s.low;
67 return n.s.high / d.s.low;
Daniel Dunbarb3a69012009-06-26 16:47:03 +000068 }
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000069 /* d.s.high != 0 */
70 if (n.s.low == 0)
Daniel Dunbarb3a69012009-06-26 16:47:03 +000071 {
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000072 /* K 0
73 * ---
74 * K 0
75 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +000076 if (rem)
77 {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000078 r.s.high = n.s.high % d.s.high;
79 r.s.low = 0;
Daniel Dunbarb3a69012009-06-26 16:47:03 +000080 *rem = r.all;
81 }
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000082 return n.s.high / d.s.high;
Daniel Dunbarb3a69012009-06-26 16:47:03 +000083 }
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000084 /* K K
85 * ---
86 * K 0
87 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000088 if ((d.s.high & (d.s.high - 1)) == 0) /* if d is a power of 2 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +000089 {
90 if (rem)
91 {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000092 r.s.low = n.s.low;
93 r.s.high = n.s.high & (d.s.high - 1);
Daniel Dunbarb3a69012009-06-26 16:47:03 +000094 *rem = r.all;
95 }
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +000096 return n.s.high >> __builtin_ctz(d.s.high);
Daniel Dunbarb3a69012009-06-26 16:47:03 +000097 }
Edward O'Callaghan37a6a452009-08-07 20:30:09 +000098 /* K K
99 * ---
100 * K 0
101 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000102 sr = __builtin_clz(d.s.high) - __builtin_clz(n.s.high);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000103 /* 0 <= sr <= n_uword_bits - 2 or sr large */
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000104 if (sr > n_uword_bits - 2)
105 {
106 if (rem)
107 *rem = n.all;
108 return 0;
109 }
110 ++sr;
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000111 /* 1 <= sr <= n_uword_bits - 1 */
112 /* q.all = n.all << (n_udword_bits - sr); */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000113 q.s.low = 0;
114 q.s.high = n.s.low << (n_uword_bits - sr);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000115 /* r.all = n.all >> sr; */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000116 r.s.high = n.s.high >> sr;
117 r.s.low = (n.s.high << (n_uword_bits - sr)) | (n.s.low >> sr);
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000118 }
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000119 else /* d.s.low != 0 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000120 {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000121 if (d.s.high == 0)
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000122 {
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000123 /* K X
124 * ---
125 * 0 K
126 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000127 if ((d.s.low & (d.s.low - 1)) == 0) /* if d is a power of 2 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000128 {
129 if (rem)
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000130 *rem = n.s.low & (d.s.low - 1);
131 if (d.s.low == 1)
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000132 return n.all;
Joerg Sonnenbergerd4260912011-07-28 19:47:33 +0000133 sr = __builtin_ctz(d.s.low);
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000134 q.s.high = n.s.high >> sr;
135 q.s.low = (n.s.high << (n_uword_bits - sr)) | (n.s.low >> sr);
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000136 return q.all;
137 }
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000138 /* K X
139 * ---
140 *0 K
141 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000142 sr = 1 + n_uword_bits + __builtin_clz(d.s.low) - __builtin_clz(n.s.high);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000143 /* 2 <= sr <= n_udword_bits - 1
144 * q.all = n.all << (n_udword_bits - sr);
145 * r.all = n.all >> sr;
146 * if (sr == n_uword_bits)
147 * {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000148 * q.s.low = 0;
149 * q.s.high = n.s.low;
150 * r.s.high = 0;
151 * r.s.low = n.s.high;
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000152 * }
153 * else if (sr < n_uword_bits) // 2 <= sr <= n_uword_bits - 1
154 * {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000155 * q.s.low = 0;
156 * q.s.high = n.s.low << (n_uword_bits - sr);
157 * r.s.high = n.s.high >> sr;
158 * r.s.low = (n.s.high << (n_uword_bits - sr)) | (n.s.low >> sr);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000159 * }
160 * else // n_uword_bits + 1 <= sr <= n_udword_bits - 1
161 * {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000162 * q.s.low = n.s.low << (n_udword_bits - sr);
163 * q.s.high = (n.s.high << (n_udword_bits - sr)) |
164 * (n.s.low >> (sr - n_uword_bits));
165 * r.s.high = 0;
166 * r.s.low = n.s.high >> (sr - n_uword_bits);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000167 * }
168 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000169 q.s.low = (n.s.low << (n_udword_bits - sr)) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000170 ((si_int)(n_uword_bits - sr) >> (n_uword_bits-1));
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000171 q.s.high = ((n.s.low << ( n_uword_bits - sr)) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000172 ((si_int)(sr - n_uword_bits - 1) >> (n_uword_bits-1))) |
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000173 (((n.s.high << (n_udword_bits - sr)) |
174 (n.s.low >> (sr - n_uword_bits))) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000175 ((si_int)(n_uword_bits - sr) >> (n_uword_bits-1)));
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000176 r.s.high = (n.s.high >> sr) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000177 ((si_int)(sr - n_uword_bits) >> (n_uword_bits-1));
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000178 r.s.low = ((n.s.high >> (sr - n_uword_bits)) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000179 ((si_int)(n_uword_bits - sr - 1) >> (n_uword_bits-1))) |
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000180 (((n.s.high << (n_uword_bits - sr)) |
181 (n.s.low >> sr)) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000182 ((si_int)(sr - n_uword_bits) >> (n_uword_bits-1)));
183 }
184 else
185 {
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000186 /* K X
187 * ---
188 * K K
189 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000190 sr = __builtin_clz(d.s.high) - __builtin_clz(n.s.high);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000191 /* 0 <= sr <= n_uword_bits - 1 or sr large */
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000192 if (sr > n_uword_bits - 1)
193 {
194 if (rem)
195 *rem = n.all;
196 return 0;
197 }
198 ++sr;
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000199 /* 1 <= sr <= n_uword_bits */
200 /* q.all = n.all << (n_udword_bits - sr); */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000201 q.s.low = 0;
202 q.s.high = n.s.low << (n_uword_bits - sr);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000203 /* r.all = n.all >> sr;
204 * if (sr < n_uword_bits)
205 * {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000206 * r.s.high = n.s.high >> sr;
207 * r.s.low = (n.s.high << (n_uword_bits - sr)) | (n.s.low >> sr);
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000208 * }
209 * else
210 * {
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000211 * r.s.high = 0;
212 * r.s.low = n.s.high;
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000213 * }
214 */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000215 r.s.high = (n.s.high >> sr) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000216 ((si_int)(sr - n_uword_bits) >> (n_uword_bits-1));
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000217 r.s.low = (n.s.high << (n_uword_bits - sr)) |
218 ((n.s.low >> sr) &
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000219 ((si_int)(sr - n_uword_bits) >> (n_uword_bits-1)));
220 }
221 }
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000222 /* Not a special case
223 * q and r are initialized with:
224 * q.all = n.all << (n_udword_bits - sr);
225 * r.all = n.all >> sr;
226 * 1 <= sr <= n_udword_bits - 1
227 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000228 su_int carry = 0;
229 for (; sr > 0; --sr)
230 {
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000231 /* r:q = ((r:q) << 1) | carry */
Edward O'Callaghan8bf1e092009-08-09 18:41:02 +0000232 r.s.high = (r.s.high << 1) | (r.s.low >> (n_uword_bits - 1));
233 r.s.low = (r.s.low << 1) | (q.s.high >> (n_uword_bits - 1));
234 q.s.high = (q.s.high << 1) | (q.s.low >> (n_uword_bits - 1));
235 q.s.low = (q.s.low << 1) | carry;
Edward O'Callaghan37a6a452009-08-07 20:30:09 +0000236 /* carry = 0;
237 * if (r.all >= d.all)
238 * {
239 * r.all -= d.all;
240 * carry = 1;
241 * }
242 */
Daniel Dunbarb3a69012009-06-26 16:47:03 +0000243 const di_int s = (di_int)(d.all - r.all - 1) >> (n_udword_bits - 1);
244 carry = s & 1;
245 r.all -= d.all & s;
246 }
247 q.all = (q.all << 1) | carry;
248 if (rem)
249 *rem = r.all;
250 return q.all;
251}