| /* longlong.h -- based on code from gcc-2.95.3 |
| |
| definitions for mixed size 32/64 bit arithmetic. |
| Copyright (C) 1991, 92, 94, 95, 96, 1997, 1998 Free Software Foundation, Inc. |
| |
| This definition file is free software; you can redistribute it |
| and/or modify it under the terms of the GNU General Public |
| License as published by the Free Software Foundation; either |
| version 2, or (at your option) any later version. |
| |
| This definition file is distributed in the hope that it will be |
| useful, but WITHOUT ANY WARRANTY; without even the implied |
| warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. |
| See the GNU General Public License for more details. |
| |
| You should have received a copy of the GNU General Public License |
| along with this program; if not, write to the Free Software |
| Foundation, Inc., 59 Temple Place - Suite 330, |
| Boston, MA 02111-1307, USA. */ |
| |
| /* Borrowed from GCC 2.95.3, I Molton 29/07/01 */ |
| |
| #ifndef SI_TYPE_SIZE |
| #define SI_TYPE_SIZE 32 |
| #endif |
| |
| #define __BITS4 (SI_TYPE_SIZE / 4) |
| #define __ll_B (1L << (SI_TYPE_SIZE / 2)) |
| #define __ll_lowpart(t) ((u32) (t) % __ll_B) |
| #define __ll_highpart(t) ((u32) (t) / __ll_B) |
| |
| /* Define auxiliary asm macros. |
| |
| 1) umul_ppmm(high_prod, low_prod, multipler, multiplicand) |
| multiplies two u32 integers MULTIPLER and MULTIPLICAND, |
| and generates a two-part u32 product in HIGH_PROD and |
| LOW_PROD. |
| |
| 2) __umulsidi3(a,b) multiplies two u32 integers A and B, |
| and returns a u64 product. This is just a variant of umul_ppmm. |
| |
| 3) udiv_qrnnd(quotient, remainder, high_numerator, low_numerator, |
| denominator) divides a two-word unsigned integer, composed by the |
| integers HIGH_NUMERATOR and LOW_NUMERATOR, by DENOMINATOR and |
| places the quotient in QUOTIENT and the remainder in REMAINDER. |
| HIGH_NUMERATOR must be less than DENOMINATOR for correct operation. |
| If, in addition, the most significant bit of DENOMINATOR must be 1, |
| then the pre-processor symbol UDIV_NEEDS_NORMALIZATION is defined to 1. |
| |
| 4) sdiv_qrnnd(quotient, remainder, high_numerator, low_numerator, |
| denominator). Like udiv_qrnnd but the numbers are signed. The |
| quotient is rounded towards 0. |
| |
| 5) count_leading_zeros(count, x) counts the number of zero-bits from |
| the msb to the first non-zero bit. This is the number of steps X |
| needs to be shifted left to set the msb. Undefined for X == 0. |
| |
| 6) add_ssaaaa(high_sum, low_sum, high_addend_1, low_addend_1, |
| high_addend_2, low_addend_2) adds two two-word unsigned integers, |
| composed by HIGH_ADDEND_1 and LOW_ADDEND_1, and HIGH_ADDEND_2 and |
| LOW_ADDEND_2 respectively. The result is placed in HIGH_SUM and |
| LOW_SUM. Overflow (i.e. carry out) is not stored anywhere, and is |
| lost. |
| |
| 7) sub_ddmmss(high_difference, low_difference, high_minuend, |
| low_minuend, high_subtrahend, low_subtrahend) subtracts two |
| two-word unsigned integers, composed by HIGH_MINUEND_1 and |
| LOW_MINUEND_1, and HIGH_SUBTRAHEND_2 and LOW_SUBTRAHEND_2 |
| respectively. The result is placed in HIGH_DIFFERENCE and |
| LOW_DIFFERENCE. Overflow (i.e. carry out) is not stored anywhere, |
| and is lost. |
| |
| If any of these macros are left undefined for a particular CPU, |
| C macros are used. */ |
| |
| #if defined (__arm__) |
| #define add_ssaaaa(sh, sl, ah, al, bh, bl) \ |
| __asm__ ("adds %1, %4, %5 \n\ |
| adc %0, %2, %3" \ |
| : "=r" ((u32) (sh)), \ |
| "=&r" ((u32) (sl)) \ |
| : "%r" ((u32) (ah)), \ |
| "rI" ((u32) (bh)), \ |
| "%r" ((u32) (al)), \ |
| "rI" ((u32) (bl))) |
| #define sub_ddmmss(sh, sl, ah, al, bh, bl) \ |
| __asm__ ("subs %1, %4, %5 \n\ |
| sbc %0, %2, %3" \ |
| : "=r" ((u32) (sh)), \ |
| "=&r" ((u32) (sl)) \ |
| : "r" ((u32) (ah)), \ |
| "rI" ((u32) (bh)), \ |
| "r" ((u32) (al)), \ |
| "rI" ((u32) (bl))) |
| #define umul_ppmm(xh, xl, a, b) \ |
| {register u32 __t0, __t1, __t2; \ |
| __asm__ ("%@ Inlined umul_ppmm \n\ |
| mov %2, %5, lsr #16 \n\ |
| mov %0, %6, lsr #16 \n\ |
| bic %3, %5, %2, lsl #16 \n\ |
| bic %4, %6, %0, lsl #16 \n\ |
| mul %1, %3, %4 \n\ |
| mul %4, %2, %4 \n\ |
| mul %3, %0, %3 \n\ |
| mul %0, %2, %0 \n\ |
| adds %3, %4, %3 \n\ |
| addcs %0, %0, #65536 \n\ |
| adds %1, %1, %3, lsl #16 \n\ |
| adc %0, %0, %3, lsr #16" \ |
| : "=&r" ((u32) (xh)), \ |
| "=r" ((u32) (xl)), \ |
| "=&r" (__t0), "=&r" (__t1), "=r" (__t2) \ |
| : "r" ((u32) (a)), \ |
| "r" ((u32) (b)));} |
| #define UMUL_TIME 20 |
| #define UDIV_TIME 100 |
| #endif /* __arm__ */ |
| |
| #define __umulsidi3(u, v) \ |
| ({DIunion __w; \ |
| umul_ppmm (__w.s.high, __w.s.low, u, v); \ |
| __w.ll; }) |
| |
| #define __udiv_qrnnd_c(q, r, n1, n0, d) \ |
| do { \ |
| u32 __d1, __d0, __q1, __q0; \ |
| u32 __r1, __r0, __m; \ |
| __d1 = __ll_highpart (d); \ |
| __d0 = __ll_lowpart (d); \ |
| \ |
| __r1 = (n1) % __d1; \ |
| __q1 = (n1) / __d1; \ |
| __m = (u32) __q1 * __d0; \ |
| __r1 = __r1 * __ll_B | __ll_highpart (n0); \ |
| if (__r1 < __m) \ |
| { \ |
| __q1--, __r1 += (d); \ |
| if (__r1 >= (d)) /* i.e. we didn't get carry when adding to __r1 */\ |
| if (__r1 < __m) \ |
| __q1--, __r1 += (d); \ |
| } \ |
| __r1 -= __m; \ |
| \ |
| __r0 = __r1 % __d1; \ |
| __q0 = __r1 / __d1; \ |
| __m = (u32) __q0 * __d0; \ |
| __r0 = __r0 * __ll_B | __ll_lowpart (n0); \ |
| if (__r0 < __m) \ |
| { \ |
| __q0--, __r0 += (d); \ |
| if (__r0 >= (d)) \ |
| if (__r0 < __m) \ |
| __q0--, __r0 += (d); \ |
| } \ |
| __r0 -= __m; \ |
| \ |
| (q) = (u32) __q1 * __ll_B | __q0; \ |
| (r) = __r0; \ |
| } while (0) |
| |
| #define UDIV_NEEDS_NORMALIZATION 1 |
| #define udiv_qrnnd __udiv_qrnnd_c |
| |
| #define count_leading_zeros(count, x) \ |
| do { \ |
| u32 __xr = (x); \ |
| u32 __a; \ |
| \ |
| if (SI_TYPE_SIZE <= 32) \ |
| { \ |
| __a = __xr < ((u32)1<<2*__BITS4) \ |
| ? (__xr < ((u32)1<<__BITS4) ? 0 : __BITS4) \ |
| : (__xr < ((u32)1<<3*__BITS4) ? 2*__BITS4 : 3*__BITS4); \ |
| } \ |
| else \ |
| { \ |
| for (__a = SI_TYPE_SIZE - 8; __a > 0; __a -= 8) \ |
| if (((__xr >> __a) & 0xff) != 0) \ |
| break; \ |
| } \ |
| \ |
| (count) = SI_TYPE_SIZE - (__clz_tab[__xr >> __a] + __a); \ |
| } while (0) |