/* Copyright (c) 2016-2018 Chung, Hyung-Hwan. All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. THIS SOFTWARE IS PROVIDED BY THE AUTHOR "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "hcl-prv.h" #if (HCL_LIW_BITS == HCL_OOW_BITS) /* nothing special */ #elif (HCL_LIW_BITS == HCL_OOHW_BITS) # define MAKE_WORD(hw1,hw2) ((hcl_oow_t)(hw1) | (hcl_oow_t)(hw2) << HCL_LIW_BITS) #else # error UNSUPPORTED LIW BIT SIZE #endif #define IS_SIGN_DIFF(x,y) (((x) ^ (y)) < 0) /*#define IS_POW2(ui) (((ui) > 0) && (((ui) & (~(ui)+ 1)) == (ui)))*/ #define IS_POW2(ui) (((ui) > 0) && ((ui) & ((ui) - 1)) == 0) /* digit character array */ static char* _digitc_array[] = { "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ", "0123456789abcdefghijklmnopqrstuvwxyz" }; /* exponent table for pow2 between 1 and 32 inclusive. */ static hcl_uint8_t _exp_tab[32] = { 0, 1, 0, 2, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 0, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 5 }; static const hcl_uint8_t debruijn_32[32] = { 0, 1, 28, 2, 29, 14, 24, 3, 30, 22, 20, 15, 25, 17, 4, 8, 31, 27, 13, 23, 21, 19, 16, 7, 26, 12, 18, 6, 11, 5, 10, 9 }; static const hcl_uint8_t debruijn_64[64] = { 0, 1, 2, 53, 3, 7, 54, 27, 4, 38, 41, 8, 34, 55, 48, 28, 62, 5, 39, 46, 44, 42, 22, 9, 24, 35, 59, 56, 49, 18, 29, 11, 63, 52, 6, 26, 37, 40, 33, 47, 61, 45, 43, 21, 23, 58, 17, 10, 51, 25, 36, 32, 60, 20, 57, 16, 50, 31, 19, 15, 30, 14, 13, 12 }; #if defined(HCL_HAVE_UINT32_T) # define LOG2_FOR_POW2_32(x) (debruijn_32[(hcl_uint32_t)((hcl_uint32_t)(x) * 0x077CB531) >> 27]) #endif #if defined(HCL_HAVE_UINT64_T) # define LOG2_FOR_POW2_64(x) (debruijn_64[(hcl_uint64_t)((hcl_uint64_t)(x) * 0x022fdd63cc95386d) >> 58]) #endif #if defined(HCL_HAVE_UINT32_T) && (HCL_SIZEOF_OOW_T == HCL_SIZEOF_UINT32_T) # define LOG2_FOR_POW2(x) LOG2_FOR_POW2_32(x) #elif defined(HCL_HAVE_UINT64_T) && (HCL_SIZEOF_OOW_T == HCL_SIZEOF_UINT64_T) # define LOG2_FOR_POW2(x) LOG2_FOR_POW2_64(x) #else # define LOG2_FOR_POW2(x) hcl_get_pos_of_msb_set_pow2(x) #endif #if (HCL_SIZEOF_OOW_T == HCL_SIZEOF_INT) && defined(HCL_HAVE_BUILTIN_UADD_OVERFLOW) # define oow_add_overflow(a,b,c) __builtin_uadd_overflow(a,b,c) #elif (HCL_SIZEOF_OOW_T == HCL_SIZEOF_LONG) && defined(HCL_HAVE_BUILTIN_UADDL_OVERFLOW) # define oow_add_overflow(a,b,c) __builtin_uaddl_overflow(a,b,c) #elif (HCL_SIZEOF_OOW_T == HCL_SIZEOF_LONG_LONG) && defined(HCL_HAVE_BUILTIN_UADDLL_OVERFLOW) # define oow_add_overflow(a,b,c) __builtin_uaddll_overflow(a,b,c) #else static HCL_INLINE int oow_add_overflow (hcl_oow_t a, hcl_oow_t b, hcl_oow_t* c) { *c = a + b; return b > HCL_TYPE_MAX(hcl_oow_t) - a; } #endif #if (HCL_SIZEOF_OOW_T == HCL_SIZEOF_INT) && defined(HCL_HAVE_BUILTIN_UMUL_OVERFLOW) # define oow_mul_overflow(a,b,c) __builtin_umul_overflow(a,b,c) #elif (HCL_SIZEOF_OOW_T == HCL_SIZEOF_LONG) && defined(HCL_HAVE_BUILTIN_UMULL_OVERFLOW) # define oow_mul_overflow(a,b,c) __builtin_umull_overflow(a,b,c) #elif (HCL_SIZEOF_OOW_T == HCL_SIZEOF_LONG_LONG) && defined(HCL_HAVE_BUILTIN_UMULLL_OVERFLOW) # define oow_mul_overflow(a,b,c) __builtin_umulll_overflow(a,b,c) #else static HCL_INLINE int oow_mul_overflow (hcl_oow_t a, hcl_oow_t b, hcl_oow_t* c) { #if (HCL_SIZEOF_UINTMAX_T > HCL_SIZEOF_OOW_T) hcl_uintmax_t k; k = (hcl_uintmax_t)a * (hcl_uintmax_t)b; *c = (hcl_oow_t)k; return (k >> HCL_OOW_BITS) > 0; /*return k > HCL_TYPE_MAX(hcl_oow_t);*/ #else *c = a * b; return b != 0 && a > HCL_TYPE_MAX(hcl_oow_t) / b; /* works for unsigned types only */ #endif } #endif #if (HCL_SIZEOF_OOI_T == HCL_SIZEOF_INT) && defined(HCL_HAVE_BUILTIN_SMUL_OVERFLOW) # define shcli_mul_overflow(hcl,a,b,c) __builtin_smul_overflow(a,b,c) #elif (HCL_SIZEOF_OOI_T == HCL_SIZEOF_LONG) && defined(HCL_HAVE_BUILTIN_SMULL_OVERFLOW) # define shcli_mul_overflow(hcl,a,b,c) __builtin_smull_overflow(a,b,c) #elif (HCL_SIZEOF_OOI_T == HCL_SIZEOF_LONG_LONG) && defined(HCL_HAVE_BUILTIN_SMULLL_OVERFLOW) # define shcli_mul_overflow(hcl,a,b,c) __builtin_smulll_overflow(a,b,c) #else static HCL_INLINE int shcli_mul_overflow (hcl_t* hcl, hcl_ooi_t a, hcl_ooi_t b, hcl_ooi_t* c) { /* take note that this function is not supposed to handle * the whole hcl_ooi_t range. it handles the shcli subrange */ #if (HCL_SIZEOF_UINTMAX_T > HCL_SIZEOF_OOI_T) hcl_intmax_t k; HCL_ASSERT (hcl, HCL_IN_SMOOI_RANGE(a)); HCL_ASSERT (hcl, HCL_IN_SMOOI_RANGE(b)); k = (hcl_intmax_t)a * (hcl_intmax_t)b; *c = (hcl_ooi_t)k; return k > HCL_TYPE_MAX(hcl_ooi_t) || k < HCL_TYPE_MIN(hcl_ooi_t); #else hcl_ooi_t ua, ub; HCL_ASSERT (hcl, HCL_IN_SMOOI_RANGE(a)); HCL_ASSERT (hcl, HCL_IN_SMOOI_RANGE(b)); *c = a * b; ub = (b >= 0)? b: -b; ua = (a >= 0)? a: -a; /* though this fomula basically works for unsigned types in principle, * the values used here are all absolute values and they fall in * a safe range to apply this fomula. the safe range is guaranteed because * the sources are supposed to be shclis. */ return ub != 0 && ua > HCL_TYPE_MAX(hcl_ooi_t) / ub; #endif } #endif #if (HCL_SIZEOF_LIW_T == HCL_SIZEOF_INT) && defined(HCL_HAVE_BUILTIN_UADD_OVERFLOW) # define liw_add_overflow(a,b,c) __builtin_uadd_overflow(a,b,c) #elif (HCL_SIZEOF_LIW_T == HCL_SIZEOF_LONG) && defined(HCL_HAVE_BUILTIN_UADDL_OVERFLOW) # define liw_add_overflow(a,b,c) __builtin_uaddl_overflow(a,b,c) #elif (HCL_SIZEOF_LIW_T == HCL_SIZEOF_LONG_LONG) && defined(HCL_HAVE_BUILTIN_UADDLL_OVERFLOW) # define liw_add_overflow(a,b,c) __builtin_uaddll_overflow(a,b,c) #else static HCL_INLINE int liw_add_overflow (hcl_liw_t a, hcl_liw_t b, hcl_liw_t* c) { *c = a + b; return b > HCL_TYPE_MAX(hcl_liw_t) - a; } #endif #if (HCL_SIZEOF_LIW_T == HCL_SIZEOF_INT) && defined(HCL_HAVE_BUILTIN_UMUL_OVERFLOW) # define liw_mul_overflow(a,b,c) __builtin_umul_overflow(a,b,c) #elif (HCL_SIZEOF_LIW_T == HCL_SIZEOF_LONG) && defined(HCL_HAVE_BUILTIN_UMULL_OVERFLOW) # define liw_mul_overflow(a,b,c) __builtin_uaddl_overflow(a,b,c) #elif (HCL_SIZEOF_LIW_T == HCL_SIZEOF_LONG_LONG) && defined(HCL_HAVE_BUILTIN_UMULLL_OVERFLOW) # define liw_mul_overflow(a,b,c) __builtin_uaddll_overflow(a,b,c) #else static HCL_INLINE int liw_mul_overflow (hcl_liw_t a, hcl_liw_t b, hcl_liw_t* c) { #if (HCL_SIZEOF_UINTMAX_T > HCL_SIZEOF_LIW_T) hcl_uintmax_t k; k = (hcl_uintmax_t)a * (hcl_uintmax_t)b; *c = (hcl_liw_t)k; return (k >> HCL_LIW_BITS) > 0; /*return k > HCL_TYPE_MAX(hcl_liw_t);*/ #else *c = a * b; return b != 0 && a > HCL_TYPE_MAX(hcl_liw_t) / b; /* works for unsigned types only */ #endif } #endif static int is_normalized_integer (hcl_t* hcl, hcl_oop_t oop) { if (HCL_OOP_IS_SMOOI(oop)) return 1; if (HCL_IS_BIGINT(hcl,oop)) { hcl_oow_t sz; sz = HCL_OBJ_GET_SIZE(oop); HCL_ASSERT (hcl, sz >= 1); return HCL_OBJ_GET_LIWORD_VAL(oop, sz - 1) != 0; } return 0; } static HCL_INLINE int bigint_to_oow_noseterr (hcl_t* hcl, hcl_oop_t num, hcl_oow_t* w) { HCL_ASSERT (hcl, HCL_IS_BIGINT(hcl,num)); #if (HCL_LIW_BITS == HCL_OOW_BITS) HCL_ASSERT (hcl, HCL_OBJ_GET_SIZE(num) >= 1); if (HCL_OBJ_GET_SIZE(num) == 1) { *w = HCL_OBJ_GET_WORD_VAL(num, 0); return HCL_IS_NBIGINT(hcl,num)? -1: 1; } #elif (HCL_LIW_BITS == HCL_OOHW_BITS) /* this function must be called with a real large integer. * a real large integer is at least 2 half-word long. * you must not call this function with an unnormalized * large integer. */ HCL_ASSERT (hcl, HCL_OBJ_GET_SIZE(num) >= 2); if (HCL_OBJ_GET_SIZE(num) == 2) { *w = MAKE_WORD(HCL_OBJ_GET_HALFWORD_VAL(num, 0), HCL_OBJ_GET_HALFWORD_VAL(num, 1)); return HCL_IS_NBIGINT(hcl,num)? -1: 1; } #else # error UNSUPPORTED LIW BIT SIZE #endif return 0; /* not convertable */ } static HCL_INLINE int integer_to_oow_noseterr (hcl_t* hcl, hcl_oop_t x, hcl_oow_t* w) { /* return value * 1 - a positive number including 0 that can fit into hcl_oow_t * -1 - a negative number whose absolute value can fit into hcl_oow_t * 0 - number too large or too small */ if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); if (v < 0) { *w = -v; return -1; } else { *w = v; return 1; } } HCL_ASSERT (hcl, hcl_isbigint(hcl, x)); return bigint_to_oow_noseterr(hcl, x, w); } int hcl_inttooow_noseterr (hcl_t* hcl, hcl_oop_t x, hcl_oow_t* w) { if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); if (v < 0) { *w = -v; return -1; /* negative number negated - kind of an error */ } else { *w = v; return 1; /* zero or positive number */ } } /* 0 -> too big, too small, or not an integer */ return hcl_isbigint(hcl, x)? bigint_to_oow_noseterr(hcl, x, w): 0; } int hcl_inttooow (hcl_t* hcl, hcl_oop_t x, hcl_oow_t* w) { if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); if (v < 0) { *w = -v; hcl_seterrnum (hcl, HCL_ERANGE); return -1; /* negative number negated - kind of an error */ } else { *w = v; return 1; /* zero or positive number */ } } if (hcl_isbigint(hcl, x)) { int n; if ((n = bigint_to_oow_noseterr(hcl, x, w)) <= 0) hcl_seterrnum (hcl, HCL_ERANGE); return n; } hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O", x); return 0; /* not convertable - too big, too small, or not integer */ } int hcl_inttoooi_noseterr (hcl_t* hcl, hcl_oop_t x, hcl_ooi_t* i) { if (HCL_OOP_IS_SMOOI(x)) { *i = HCL_OOP_TO_SMOOI(x); return (*i < 0)? -1: 1; } if (hcl_isbigint(hcl, x)) { hcl_oow_t w; int n; n = bigint_to_oow_noseterr(hcl, x, &w); if (n < 0) { HCL_STATIC_ASSERT (HCL_TYPE_MAX(hcl_ooi_t) + HCL_TYPE_MIN(hcl_ooi_t) == -1); /* assume 2's complement */ if (w > (hcl_oow_t)HCL_TYPE_MAX(hcl_ooi_t) + 1) return 0; /* too small */ *i = -w; /* negate back */ } else if (n > 0) { if (w > HCL_TYPE_MAX(hcl_ooi_t)) return 0; /* too big */ *i = w; } return n; } return 0; /* not integer */ } int hcl_inttoooi (hcl_t* hcl, hcl_oop_t x, hcl_ooi_t* i) { if (HCL_OOP_IS_SMOOI(x)) { *i = HCL_OOP_TO_SMOOI(x); return (*i < 0)? -1: 1; } if (hcl_isbigint(hcl, x)) { hcl_oow_t w; int n; n = bigint_to_oow_noseterr(hcl, x, &w); if (n < 0) { HCL_STATIC_ASSERT (HCL_TYPE_MAX(hcl_ooi_t) + HCL_TYPE_MIN(hcl_ooi_t) == -1); /* assume 2's complement */ if (w > (hcl_oow_t)HCL_TYPE_MAX(hcl_ooi_t) + 1) { hcl_seterrnum (hcl, HCL_ERANGE); return 0; /* too small */ } *i = -w; /* negate back */ } else if (n > 0) { if (w > HCL_TYPE_MAX(hcl_ooi_t)) { hcl_seterrnum (hcl, HCL_ERANGE); return 0; /* too big */ } *i = w; } else { hcl_seterrnum (hcl, HCL_ERANGE); } return n; } hcl_seterrbfmt (hcl, HCL_EINVAL, "not an integer - %O", x); return 0; /* not integer */ } #if (HCL_SIZEOF_UINTMAX_T == HCL_SIZEOF_OOW_T) /* do nothing. required macros are defined in hcl.h */ #elif (HCL_SIZEOF_UINTMAX_T == HCL_SIZEOF_OOW_T * 2) static HCL_INLINE int bigint_to_uintmax (hcl_t* hcl, hcl_oop_t num, hcl_uintmax_t* w) { HCL_ASSERT (hcl, HCL_OOP_IS_POINTER(num)); HCL_ASSERT (hcl, HCL_IS_PBIGINT(hcl, num) || HCL_IS_NBIGINT(hcl, num)); #if (HCL_LIW_BITS == HCL_OOW_BITS) HCL_ASSERT (hcl, HCL_OBJ_GET_SIZE(num) >= 1); switch (HCL_OBJ_GET_SIZE(num)) { case 1: *w = (hcl_uintmax_t)HCL_OBJ_GET_WORD_VAL(num, 0); goto done; case 2: *w = ((hcl_uintmax_t)HCL_OBJ_GET_WORD_VAL(num, 0) << HCL_LIW_BITS) | HCL_OBJ_GET_WORD_VAL(num, 1); goto done; default: goto oops_range; } #elif (HCL_LIW_BITS == HCL_OOHW_BITS) HCL_ASSERT (hcl, HCL_OBJ_GET_SIZE(num) >= 2); switch (HCL_OBJ_GET_SIZE(num)) { case 2: *w = ((hcl_uintmax_t)HCL_OBJ_GET_HALFWORD_VAL(num, 0) << HCL_LIW_BITS) | HCL_OBJ_GET_HALFWORD_VAL(num, 1); goto done; case 4: *w = ((hcl_uintmax_t)HCL_OBJ_GET_HALFWORD_VAL(num, 0) << HCL_LIW_BITS * 3) | ((hcl_uintmax_t)HCL_OBJ_GET_HALFWORD_VAL(num, 1) << HCL_LIW_BITS * 2) | ((hcl_uintmax_t)HCL_OBJ_GET_HALFWORD_VAL(num, 2) << HCL_LIW_BITS * 1) | HCL_OBJ_GET_HALFWORD_VAL(num, 3); goto done; default: goto oops_range; } #else # error UNSUPPORTED LIW BIT SIZE #endif done: return (HCL_IS_NBIGINT(hcl, num))? -1: 1; oops_range: hcl_seterrnum (hcl, HCL_ERANGE); return 0; /* not convertable */ } int hcl_inttouintmax (hcl_t* hcl, hcl_oop_t x, hcl_uintmax_t* w) { if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); if (v < 0) { *w = -v; return -1; /* negative number negated - kind of an error */ } else { *w = v; return 1; /* zero or positive number */ } } if (hcl_isbigint(hcl, x)) return bigint_to_uintmax(hcl, x, w); hcl_seterrbfmt (hcl, HCL_EINVAL, "not an integer - %O", x); return 0; /* not convertable - too big, too small, or not an integer */ } int hcl_inttointmax (hcl_t* hcl, hcl_oop_t x, hcl_intmax_t* i) { hcl_uintmax_t w; int n; n = hcl_inttouintmax(hcl, x, &w); if (n < 0) { HCL_STATIC_ASSERT (HCL_TYPE_MAX(hcl_intmax_t) + HCL_TYPE_MIN(hcl_intmax_t) == -1); /* assume 2's complement */ if (w > (hcl_uintmax_t)HCL_TYPE_MAX(hcl_intmax_t) + 1) { hcl_seterrnum (hcl, HCL_ERANGE); /* not convertable. number too small */ return 0; } *i = -w; } else if (n > 0) { if (w > HCL_TYPE_MAX(hcl_intmax_t)) { hcl_seterrnum (hcl, HCL_ERANGE); /* not convertable. number too big */ return 0; } *i = w; } return n; } #else # error UNSUPPORTED UINTMAX SIZE #endif static HCL_INLINE hcl_oop_t make_bigint_with_oow (hcl_t* hcl, hcl_oow_t w) { #if (HCL_LIW_BITS == HCL_OOW_BITS) HCL_ASSERT (hcl, HCL_SIZEOF(hcl_oow_t) == HCL_SIZEOF(hcl_liw_t)); return hcl_makebigint(hcl, HCL_BRAND_PBIGINT, &w, 1); #elif (HCL_LIW_BITS == HCL_OOHW_BITS) hcl_liw_t hw[2]; hw[0] = w /*& HCL_LBMASK(hcl_oow_t,HCL_LIW_BITS)*/; hw[1] = w >> HCL_LIW_BITS; return hcl_makebigint(hcl, HCL_BRAND_PBIGINT, hw, (hw[1] > 0? 2: 1)); #else # error UNSUPPORTED LIW BIT SIZE #endif } static HCL_INLINE hcl_oop_t make_bigint_with_ooi (hcl_t* hcl, hcl_ooi_t i) { #if (HCL_LIW_BITS == HCL_OOW_BITS) hcl_oow_t w; HCL_STATIC_ASSERT (hcl, HCL_SIZEOF(hcl_oow_t) == HCL_SIZEOF(hcl_liw_t)); if (i >= 0) { w = i; return hcl_makebigint(hcl, HCL_BRAND_PBIGINT, &w, 1); } else { w = (i == HCL_TYPE_MIN(hcl_ooi_t))? ((hcl_oow_t)HCL_TYPE_MAX(hcl_ooi_t) + 1): -i; return hcl_makebigint(hcl, HCL_BRAND_NBIGINT, &w, 1); } #elif (HCL_LIW_BITS == HCL_OOHW_BITS) hcl_liw_t hw[2]; hcl_oow_t w; HCL_STATIC_ASSERT (HCL_SIZEOF(hcl_oohw_t) == HCL_SIZEOF(hcl_liw_t)); if (i >= 0) { w = i; hw[0] = w /*& HCL_LBMASK(hcl_oow_t,HCL_LIW_BITS)*/; hw[1] = w >> HCL_LIW_BITS; return hcl_makebigint(hcl, HCL_BRAND_PBIGINT, hw, (hw[1] > 0? 2: 1)); } else { w = -i; w = (i == HCL_TYPE_MIN(hcl_ooi_t))? ((hcl_oow_t)HCL_TYPE_MAX(hcl_ooi_t) + 1): -i; hw[0] = w /*& HCL_LBMASK(hcl_oow_t,HCL_LIW_BITS)*/; hw[1] = w >> HCL_LIW_BITS; return hcl_makebigint(hcl, HCL_BRAND_NBIGINT, hw, (hw[1] > 0? 2: 1)); } #else # error UNSUPPORTED LIW BIT SIZE #endif } static HCL_INLINE hcl_oop_t make_bloated_bigint_with_ooi (hcl_t* hcl, hcl_ooi_t i, hcl_oow_t extra) { #if (HCL_LIW_BITS == HCL_OOW_BITS) hcl_oow_t w; hcl_oop_t z; HCL_ASSERT (hcl, extra <= HCL_OBJ_SIZE_MAX - 1); HCL_STATIC_ASSERT (hcl, HCL_SIZEOF(hcl_oow_t) == HCL_SIZEOF(hcl_liw_t)); if (i >= 0) { w = i; z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, 1 + extra); } else { w = (i == HCL_TYPE_MIN(hcl_ooi_t))? ((hcl_oow_t)HCL_TYPE_MAX(hcl_ooi_t) + 1): -i; z = hcl_makebigint(hcl, HCL_BRAND_NBIGINT, HCL_NULL, 1 + extra); } if (!z) return HCL_NULL; HCL_OBJ_SET_LIWORD_VAL (z, 0, w); return z; #elif (HCL_LIW_BITS == HCL_OOHW_BITS) hcl_liw_t hw[2]; hcl_oow_t w; hcl_oop_t z; HCL_ASSERT (hcl, extra <= HCL_OBJ_SIZE_MAX - 2); if (i >= 0) { w = i; hw[0] = w /*& HCL_LBMASK(hcl_oow_t,HCL_LIW_BITS)*/; hw[1] = w >> HCL_LIW_BITS; z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, (hw[1] > 0? 2: 1) + extra); } else { w = (i == HCL_TYPE_MIN(hcl_ooi_t))? ((hcl_oow_t)HCL_TYPE_MAX(hcl_ooi_t) + 1): -i; hw[0] = w /*& HCL_LBMASK(hcl_oow_t,HCL_LIW_BITS)*/; hw[1] = w >> HCL_LIW_BITS; z = hcl_makebigint(hcl, HCL_BRAND_NBIGINT, HCL_NULL, (hw[1] > 0? 2: 1) + extra); } if (!z) return HCL_NULL; HCL_OBJ_SET_LIWORD_VAL (z, 0, hw[0]); if (hw[1] > 0) HCL_OBJ_SET_LIWORD_VAL (z, 1, hw[1]); return z; #else # error UNSUPPORTED LIW BIT SIZE #endif } static HCL_INLINE hcl_oop_t make_bigint_with_intmax (hcl_t* hcl, hcl_intmax_t v) { hcl_oow_t len; hcl_liw_t buf[HCL_SIZEOF_INTMAX_T / HCL_SIZEOF_LIW_T]; hcl_uintmax_t ui; int brand; /* this is not a generic function. it can't handle v * if it's HCL_TYPE_MIN(hcl_intmax_t) */ HCL_ASSERT (hcl, v > HCL_TYPE_MIN(hcl_intmax_t)); if (v >= 0) { ui = v; brand = HCL_BRAND_PBIGINT; } else { ui = (v == HCL_TYPE_MIN(hcl_intmax_t))? ((hcl_uintmax_t)HCL_TYPE_MAX(hcl_intmax_t) + 1): -v; brand = HCL_BRAND_NBIGINT; } len = 0; do { buf[len++] = (hcl_liw_t)ui; ui = ui >> HCL_LIW_BITS; } while (ui > 0); return hcl_makebigint(hcl, brand, buf, len); } static HCL_INLINE hcl_oop_t make_bigint_with_uintmax (hcl_t* hcl, hcl_uintmax_t ui) { hcl_oow_t len; hcl_liw_t buf[HCL_SIZEOF_INTMAX_T / HCL_SIZEOF_LIW_T]; len = 0; do { buf[len++] = (hcl_liw_t)ui; ui = ui >> HCL_LIW_BITS; } while (ui > 0); return hcl_makebigint(hcl, HCL_BRAND_PBIGINT, buf, len); } hcl_oop_t hcl_oowtoint (hcl_t* hcl, hcl_oow_t w) { HCL_ASSERT (hcl, HCL_TYPE_IS_UNSIGNED(hcl_oow_t)); /*if (HCL_IN_SMOOI_RANGE(w))*/ if (w <= HCL_SMOOI_MAX) { return HCL_SMOOI_TO_OOP(w); } else { return make_bigint_with_oow(hcl, w); } } hcl_oop_t hcl_ooitoint (hcl_t* hcl, hcl_ooi_t i) { if (HCL_IN_SMOOI_RANGE(i)) { return HCL_SMOOI_TO_OOP(i); } else { return make_bigint_with_ooi (hcl, i); } } #if (HCL_SIZEOF_UINTMAX_T == HCL_SIZEOF_OOW_T) /* do nothing. required macros are defined in hcl.h */ #else hcl_oop_t hcl_intmaxtoint (hcl_t* hcl, hcl_intmax_t i) { if (HCL_IN_SMOOI_RANGE(i)) { return HCL_SMOOI_TO_OOP(i); } else { return make_bigint_with_intmax(hcl, i); } } hcl_oop_t hcl_uintmaxtoint (hcl_t* hcl, hcl_uintmax_t i) { if (HCL_IN_SMOOI_RANGE(i)) { return HCL_SMOOI_TO_OOP(i); } else { return make_bigint_with_uintmax(hcl, i); } } #endif static HCL_INLINE hcl_oop_t expand_bigint (hcl_t* hcl, hcl_oop_t oop, hcl_oow_t inc) { hcl_oop_t z; hcl_oow_t i; hcl_oow_t count; HCL_ASSERT (hcl, HCL_OOP_IS_POINTER(oop)); count = HCL_OBJ_GET_SIZE(oop); if (inc > HCL_OBJ_SIZE_MAX - count) { hcl_seterrnum (hcl, HCL_EOOMEM); /* TODO: is it a soft failure or a hard failure? is this error code proper? */ return HCL_NULL; } hcl_pushvolat (hcl, &oop); z = hcl_makebigint(hcl, HCL_OBJ_GET_FLAGS_BRAND(oop), HCL_NULL, count + inc); hcl_popvolat (hcl); if (!z) return HCL_NULL; for (i = 0; i < count; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)oop)->slot[i]; } return z; } static HCL_INLINE hcl_oop_t _clone_bigint (hcl_t* hcl, hcl_oop_t oop, hcl_oow_t count, int brand) { hcl_oop_t z; hcl_oow_t i; HCL_ASSERT (hcl, HCL_OOP_IS_POINTER(oop)); if (count <= 0) count = HCL_OBJ_GET_SIZE(oop); hcl_pushvolat (hcl, &oop); z = hcl_makebigint(hcl, brand, HCL_NULL, count); hcl_popvolat (hcl); if (!z) return HCL_NULL; for (i = 0; i < count; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)oop)->slot[i]; } return z; } static HCL_INLINE hcl_oop_t clone_bigint (hcl_t* hcl, hcl_oop_t oop, hcl_oow_t count) { return _clone_bigint (hcl, oop, count, HCL_OBJ_GET_FLAGS_BRAND(oop)); } static HCL_INLINE hcl_oop_t clone_bigint_negated (hcl_t* hcl, hcl_oop_t oop, hcl_oow_t count) { int brand; HCL_ASSERT (hcl, HCL_IS_BIGINT(hcl,oop)); if (HCL_IS_PBIGINT(hcl, oop)) { brand = HCL_BRAND_NBIGINT; } else { HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, oop)); brand = HCL_BRAND_PBIGINT; } return _clone_bigint (hcl, oop, count, brand); } static HCL_INLINE hcl_oop_t clone_bigint_to_positive (hcl_t* hcl, hcl_oop_t oop, hcl_oow_t count) { return _clone_bigint (hcl, oop, count, HCL_BRAND_PBIGINT); } static HCL_INLINE hcl_oow_t count_effective (hcl_liw_t* x, hcl_oow_t xs) { #if 0 while (xs > 1 && x[xs - 1] == 0) xs--; return xs; #else while (xs > 1) { if (x[--xs]) return xs + 1; } return 1; #endif } static HCL_INLINE hcl_oow_t count_effective_digits (hcl_oop_t oop) { hcl_oow_t i; for (i = HCL_OBJ_GET_SIZE(oop); i > 1; ) { --i; if (((hcl_oop_liword_t)oop)->slot[i]) return i + 1; } return 1; } static hcl_oop_t normalize_bigint (hcl_t* hcl, hcl_oop_t oop) { hcl_oow_t count; HCL_ASSERT (hcl, HCL_OOP_IS_POINTER(oop)); count = count_effective_digits (oop); #if (HCL_LIW_BITS == HCL_OOW_BITS) if (count == 1) /* 1 word */ { hcl_oow_t w; w = ((hcl_oop_liword_t)oop)->slot[0]; if (HCL_IS_PBIGINT(hcl, oop)) { if (w <= HCL_SMOOI_MAX) return HCL_SMOOI_TO_OOP(w); } else { HCL_ASSERT (hcl, -HCL_SMOOI_MAX == HCL_SMOOI_MIN); HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, oop)); if (w <= HCL_SMOOI_MAX) return HCL_SMOOI_TO_OOP(-(hcl_ooi_t)w); } } #elif (HCL_LIW_BITS == HCL_OOHW_BITS) if (count == 1) /* 1 half-word */ { if (HCL_IS_PBIGINT(hcl, oop)) { return HCL_SMOOI_TO_OOP(((hcl_oop_liword_t)oop)->slot[0]); } else { HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, oop)); return HCL_SMOOI_TO_OOP(-(hcl_ooi_t)((hcl_oop_liword_t)oop)->slot[0]); } } else if (count == 2) /* 2 half-words */ { hcl_oow_t w; w = MAKE_WORD(((hcl_oop_liword_t)oop)->slot[0], ((hcl_oop_liword_t)oop)->slot[1]); if (HCL_IS_PBIGINT(hcl, oop)) { if (w <= HCL_SMOOI_MAX) return HCL_SMOOI_TO_OOP(w); } else { HCL_ASSERT (hcl, -HCL_SMOOI_MAX == HCL_SMOOI_MIN); HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, oop)); if (w <= HCL_SMOOI_MAX) return HCL_SMOOI_TO_OOP(-(hcl_ooi_t)w); } } #else # error UNSUPPORTED LIW BIT SIZE #endif if (HCL_OBJ_GET_SIZE(oop) == count) { /* no compaction is needed. return it as it is */ return oop; } return clone_bigint (hcl, oop, count); } static HCL_INLINE int is_less_unsigned_array (const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys) { hcl_oow_t i; if (xs != ys) return xs < ys; for (i = xs; i > 0; ) { --i; if (x[i] != y[i]) return x[i] < y[i]; } return 0; } static HCL_INLINE int is_less_unsigned (hcl_oop_t x, hcl_oop_t y) { return is_less_unsigned_array ( ((hcl_oop_liword_t)x)->slot, HCL_OBJ_GET_SIZE(x), ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(y)); } static HCL_INLINE int is_less (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OBJ_GET_FLAGS_BRAND(x) != HCL_OBJ_GET_FLAGS_BRAND(y)) { return HCL_IS_NBIGINT(hcl, x); } if (HCL_IS_PBIGINT(hcl, x)) { return is_less_unsigned (x, y); } else { return is_less_unsigned (y, x); } } static HCL_INLINE int is_greater_unsigned_array (const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys) { hcl_oow_t i; if (xs != ys) return xs > ys; for (i = xs; i > 0; ) { --i; if (x[i] != y[i]) return x[i] > y[i]; } return 0; } static HCL_INLINE int is_greater_unsigned (hcl_oop_t x, hcl_oop_t y) { return is_greater_unsigned_array ( ((hcl_oop_liword_t)x)->slot, HCL_OBJ_GET_SIZE(x), ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(y)); } static HCL_INLINE int is_greater (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OBJ_GET_FLAGS_BRAND(x) != HCL_OBJ_GET_FLAGS_BRAND(y)) { return HCL_IS_NBIGINT(hcl, y); } if (HCL_IS_PBIGINT(hcl, x)) { return is_greater_unsigned (x, y); } else { return is_greater_unsigned (y, x); } } static HCL_INLINE int is_equal_unsigned_array (const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys) { return xs == ys && HCL_MEMCMP(x, y, xs * HCL_SIZEOF(*x)) == 0; } static HCL_INLINE int is_equal_unsigned (hcl_oop_t x, hcl_oop_t y) { return is_equal_unsigned_array( ((hcl_oop_liword_t)x)->slot, HCL_OBJ_GET_SIZE(x), ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(y)); } static HCL_INLINE int is_equal (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { /* check if two large integers are equal to each other */ /*return HCL_OBJ_GET_FLAGS_BRAND(x) == HCL_OBJ_GET_FLAGS_BRAND(y) && HCL_OBJ_GET_SIZE(x) == HCL_OBJ_GET_SIZE(y) && HCL_MEMCMP(((hcl_oop_liword_t)x)->slot, ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(x) * HCL_SIZEOF(hcl_liw_t)) == 0;*/ return HCL_OBJ_GET_FLAGS_BRAND(x) == HCL_OBJ_GET_FLAGS_BRAND(y) && HCL_OBJ_GET_SIZE(x) == HCL_OBJ_GET_SIZE(y) && is_equal_unsigned(x, y); } static void complement2_unsigned_array (hcl_t* hcl, const hcl_liw_t* x, hcl_oow_t xs, hcl_liw_t* z) { hcl_oow_t i; hcl_lidw_t w; hcl_lidw_t carry; /* get 2's complement (~x + 1) */ carry = 1; for (i = 0; i < xs; i++) { w = (hcl_lidw_t)(~x[i]) + carry; /*w = (hcl_lidw_t)(x[i] ^ (~(hcl_liw_t)0)) + carry;*/ carry = w >> HCL_LIW_BITS; z[i] = w; } /* if the array pointed to by x contains all zeros, carry will be * 1 here and it actually requires 1 more slot. Let't take this 8-bit * zero for instance: * 2r00000000 -> 2r11111111 + 1 => 2r0000000100000000 * * this function is not designed to handle such a case. * in fact, 0 is a small integer and it must not stand a change * to be given to this function */ HCL_ASSERT (hcl, carry == 0); } static HCL_INLINE hcl_oow_t add_unsigned_array (const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys, hcl_liw_t* z) { #if 1 register hcl_oow_t i; hcl_lidw_t w; if (xs < ys) { /* swap x and y */ i = xs; xs = ys; ys = i; i = (hcl_oow_t)x; x = y; y = (hcl_liw_t*)i; } w = 0; i = 0; while (i < ys) { w += (hcl_lidw_t)x[i] + (hcl_lidw_t)y[i]; z[i++] = w & HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS); w >>= HCL_LIW_BITS; } while (w && i < xs) { w += x[i]; z[i++] = w & HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS); w >>= HCL_LIW_BITS; } while (i < xs) { z[i] = x[i]; i++; } if (w) z[i++] = w & HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS); return i; #else register hcl_oow_t i; hcl_lidw_t w; hcl_liw_t carry = 0; if (xs < ys) { /* swap x and y */ i = xs; xs = ys; ys = i; i = (hcl_oow_t)x; x = y; y = (hcl_liw_t*)i; } for (i = 0; i < ys; i++) { w = (hcl_lidw_t)x[i] + (hcl_lidw_t)y[i] + carry; carry = w >> HCL_LIW_BITS; z[i] = w /*& HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS) */; } if (x == z) { for (; carry && i < xs; i++) { w = (hcl_lidw_t)x[i] + carry; carry = w >> HCL_LIW_BITS; z[i] = w /*& HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS) */; } i = xs; } else { for (; i < xs; i++) { w = (hcl_lidw_t)x[i] + carry; carry = w >> HCL_LIW_BITS; z[i] = w /*& HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS)*/; } } if (carry) z[i++] = carry; return i; /* the number of effective digits in the result */ #endif } static HCL_INLINE hcl_oow_t subtract_unsigned_array (hcl_t* hcl, const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys, hcl_liw_t* z) { #if 1 hcl_oow_t i; hcl_lidi_t w = 0; if (x == y) { HCL_ASSERT (hcl, xs == ys); z[0] = 0; return 1; } HCL_ASSERT (hcl, !is_less_unsigned_array(x, xs, y, ys)); for (i = 0; i < ys; i++) { w += (hcl_lidi_t)x[i] - (hcl_lidi_t)y[i]; z[i] = w & HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS); w >>= HCL_LIW_BITS; } while (w && i < xs) { w += x[i]; z[i++] = w & HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS); w >>= HCL_LIW_BITS; } while (i < xs) { z[i] = x[i]; i++; } while (i > 1 && z[i - 1] == 0) i--; return i; #else hcl_oow_t i; hcl_lidw_t w; hcl_lidw_t borrow = 0; hcl_lidw_t borrowed_word; if (x == y) { HCL_ASSERT (hcl, xs == ys); z[0] = 0; return 1; } HCL_ASSERT (hcl, !is_less_unsigned_array(x, xs, y, ys)); borrowed_word = (hcl_lidw_t)1 << HCL_LIW_BITS; for (i = 0; i < ys; i++) { w = (hcl_lidw_t)y[i] + borrow; if ((hcl_lidw_t)x[i] >= w) { z[i] = x[i] - w; borrow = 0; } else { z[i] = (borrowed_word + (hcl_lidw_t)x[i]) - w; borrow = 1; } } for (; i < xs; i++) { if (x[i] >= borrow) { z[i] = x[i] - (hcl_liw_t)borrow; borrow = 0; } else { z[i] = (borrowed_word + (hcl_lidw_t)x[i]) - borrow; borrow = 1; } } HCL_ASSERT (hcl, borrow == 0); while (i > 1 && z[i - 1] == 0) i--; return i; /* the number of effective digits in the result */ #endif } static HCL_INLINE void multiply_unsigned_array (const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys, hcl_liw_t* z) { hcl_lidw_t v; hcl_oow_t pa; if (xs < ys) { hcl_oow_t i; /* swap x and y */ i = xs; xs = ys; ys = i; i = (hcl_oow_t)x; x = y; y = (hcl_liw_t*)i; } if (ys == 1) { hcl_lidw_t dw; hcl_liw_t carry = 0; hcl_oow_t i; for (i = 0; i < xs; i++) { dw = ((hcl_lidw_t)x[i] * y[0]) + carry; carry = (hcl_liw_t)(dw >> HCL_LIW_BITS); z[i] = (hcl_liw_t)dw; } z[i] = carry; return; } pa = xs; if (pa <= ((hcl_oow_t)1 << (HCL_LIDW_BITS - (HCL_LIW_BITS * 2)))) { /* Comba(column-array) multiplication */ /* when the input length is too long, v may overflow. if it * happens, comba's method doesn't work as carry propagation is * affected badly. so we need to use this method only if * the input is short enough. */ hcl_oow_t pa, ix, iy, iz, tx, ty; pa = xs + ys; v = 0; for (ix = 0; ix < pa; ix++) { ty = (ix < ys - 1)? ix: (ys - 1); tx = ix - ty; iy = (ty + 1 < xs - tx)? (ty + 1): (xs - tx); for (iz = 0; iz < iy; iz++) { v = v + (hcl_lidw_t)x[tx + iz] * (hcl_lidw_t)y[ty - iz]; } z[ix] = (hcl_liw_t)v; v = v >> HCL_LIW_BITS; } } else { hcl_oow_t i, j; hcl_liw_t carry; for (i = 0; i < xs; i++) { if (x[i] == 0) { z[i + ys] = 0; } else { carry = 0; for (j = 0; j < ys; j++) { v = (hcl_lidw_t)x[i] * (hcl_lidw_t)y[j] + (hcl_lidw_t)carry + (hcl_lidw_t)z[i + j]; z[i + j] = (hcl_liw_t)v; carry = (hcl_liw_t)(v >> HCL_LIW_BITS); } z[i + j] = carry; } } } } /* KARATSUBA MULTIPLICATION * * c = |a| * |b| * * Let B represent the radix(2^DIGIT_BITS) * Let n represent half the number of digits * * a = a1 * B^n + a0 * b = b1 * B^n + b0 * a * b => a1b1 * B^2n + ((a1 + a0)(b1 + b0) - (a0b0 + a1b1)) * B^n + a0b0 * * -------------------------------------------------------------------- * For example, for 2 number 0xFAC2 and 0xABCD => A848635A * DIGIT_BITS = 8 (1 byte, each digit is 1 byte long) * B = 2^8 = 0x100 * n = 1 (half the digits of 2 digit numbers) * B^n = 0x100 ^ 1 = 0x100 * B^2n = 0x100 ^ 2 = 0x10000 * 0xFAC2 = 0xFA * 0x100 + 0xC2 * 0xABCD = 0xAB * 0x100 + 0xCD * a1 = 0xFA, a0 = 0xC2 * b1 = 0xAB, b0 = 0xCD * a1b1 = 0xFA * 0xAB = 0xA6FE * a0b0 = 0xC2 * 0xCD = 0x9B5A * a1 + a0 = 0xFA + 0xC2 = 0x1BC * b1 + b0 = 0xAB + 0xCD = 0x178 * -------------------------------------------------------------------- * (A6FE * 10000) + (((1BC * 178) - (985A + A6FE)) * 100) + 9B5A = * (A6FE << (8 * 2)) + (((1BC * 178) - (985A + A6FE)) << (8 * 1)) = * A6FE0000 + 14CC800 + 9B5A = 9848635A * -------------------------------------------------------------------- * * 0xABCD9876 * 0xEFEFABAB => 0xA105C97C9755A8D2 * B = 2^8 = 0x100 * n = 2 * B^n = 0x100 ^ 2 = 0x10000 * B^2n = 0x100 ^ 4 = 0x100000000 * 0xABCD9876 = 0xABCD * 0x10000 + 0x9876 * 0xEFEFABAB = 0xEFEF * 0x10000 + 0xABAB * a1 = 0xABCD, a0 = 0x9876 * b1 - 0xEFEF, b0 = 0xABAB * a1b1 = 0xA104C763 * a0b0 = 0x663CA8D2 * a1 + a0 = 0x14443 * b1 + b0 = 0x19B9A * -------------------------------------------------------------------- * (A104C763 * 100000000) + (((14443 * 19B9A) - (663CA8D2 + A104C763)) * 10000) + 663CA8D2 = * (A104C763 << (8 * 4)) + (((14443 * 19B9A) - (663CA8D2 + A104C763)) << (8 * 2)) + 663CA8D2 = A105C97C9755A8D2 * -------------------------------------------------------------------- * * Multiplying by B is t same as shifting by DIGIT_BITS. * DIGIT_BITS in this implementation is HCL_LIW_BITS * B => 2^HCL_LIW_BITS * X * B^n => X << (HCL_LIW_BITS * n) * X * B^2n => X << (HCL_LIW_BITS * n * 2) * -------------------------------------------------------------------- */ #if defined(HCL_BUILD_DEBUG) #define CANNOT_KARATSUBA(hcl,xs,ys) \ ((xs) < (hcl)->option.karatsuba_cutoff || (ys) < (hcl)->option.karatsuba_cutoff || \ ((xs) > (ys) && (ys) <= (((xs) + 1) / 2)) || \ ((xs) < (ys) && (xs) <= (((ys) + 1) / 2))) #else #define CANNOT_KARATSUBA(hcl,xs,ys) \ ((xs) < HCL_KARATSUBA_CUTOFF || (ys) < HCL_KARATSUBA_CUTOFF || \ ((xs) > (ys) && (ys) <= (((xs) + 1) / 2)) || \ ((xs) < (ys) && (xs) <= (((ys) + 1) / 2))) #endif static HCL_INLINE hcl_oow_t multiply_unsigned_array_karatsuba (hcl_t* hcl, const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys, hcl_liw_t* z) { #if 1 hcl_lidw_t nshifts; hcl_lidw_t ndigits_xh, ndigits_xl; hcl_lidw_t ndigits_yh, ndigits_yl; hcl_liw_t* tmp[2] = { HCL_NULL, HCL_NULL}; hcl_liw_t* zsp; hcl_oow_t tmplen[2]; hcl_oow_t xlen, zcapa; zcapa = xs + ys; /* the caller ensures this capacity for z at the minimum*/ if (xs < ys) { hcl_oow_t i; /* swap x and y */ i = xs; xs = ys; ys = i; i = (hcl_oow_t)x; x = y; y = (hcl_liw_t*)i; } if (ys == 1) { hcl_lidw_t dw; hcl_liw_t carry = 0; hcl_oow_t i; for (i = 0; i < xs; i++) { dw = ((hcl_lidw_t)x[i] * y[0]) + carry; carry = (hcl_liw_t)(dw >> HCL_LIW_BITS); z[i] = (hcl_liw_t)dw; } z[i] = carry; return count_effective(z, xs + 1); } /* calculate value of nshifts, that is 2^(HCL_LIW_BITS*nshifts) */ nshifts = (xs + 1) / 2; ndigits_xl = nshifts; /* ndigits of lower part of x */ ndigits_xh = xs - nshifts; /* ndigits of upper part of x */ ndigits_yl = nshifts; /* ndigits of lower part of y */ ndigits_yh = ys - nshifts; /* ndigits of uppoer part of y */ HCL_ASSERT (hcl, ndigits_xl >= ndigits_xh); HCL_ASSERT (hcl, ndigits_yl >= ndigits_yh); /* make a temporary buffer for (b0 + b1) and (a1 * b1) */ tmplen[0] = ndigits_xh + ndigits_yh; tmplen[1] = ndigits_yl + ndigits_yh + 1; if (tmplen[1] < tmplen[0]) tmplen[1] = tmplen[0]; tmp[1] = (hcl_liw_t*)hcl_callocmem(hcl, HCL_SIZEOF(hcl_liw_t) * tmplen[1]); /* TODO: should i use the object memory? */ if (!tmp[1]) goto oops; /* make a temporary for (a0 + a1) and (a0 * b0) */ tmplen[0] = ndigits_xl + ndigits_yl + 1; tmp[0] = (hcl_liw_t*)hcl_callocmem(hcl, HCL_SIZEOF(hcl_liw_t) * tmplen[0]); if (!tmp[0]) goto oops; /* tmp[0] = a0 + a1 */ tmplen[0] = add_unsigned_array(x, ndigits_xl, x + nshifts, ndigits_xh, tmp[0]); /* tmp[1] = b0 + b1 */ tmplen[1] = add_unsigned_array(y, ndigits_yl, y + nshifts, ndigits_yh, tmp[1]); /*HCL_DEBUG6 (hcl, "karatsuba t %p u %p ndigits_xl %d ndigits_xh %d ndigits_yl %d ndigits_yh %d\n", tmp[0], tmp[1], (int)ndigits_xl, (int)ndigits_xh, (int)ndigits_yl, (int)ndigits_yh);*/ /*HCL_DEBUG5 (hcl, "zcapa %d, tmplen[0] %d tmplen[1] %d nshifts %d total %d\n", (int)zcapa, (int)tmplen[0], (int)tmplen[1], (int)nshifts, (int)(tmplen[0] + tmplen[1] + nshifts));*/ /* place (a0 + a1) * (b0 + b1) at the shifted position */ zsp = z + nshifts; if (CANNOT_KARATSUBA(hcl, tmplen[0], tmplen[1])) { multiply_unsigned_array (tmp[0], tmplen[0], tmp[1], tmplen[1], zsp); xlen = count_effective(zsp, tmplen[0] + tmplen[1]); } else { xlen = multiply_unsigned_array_karatsuba(hcl, tmp[0], tmplen[0], tmp[1], tmplen[1], zsp); if (xlen == 0) goto oops; } /* tmp[0] = a0 * b0 */ tmplen[0] = ndigits_xl + ndigits_yl; HCL_MEMSET (tmp[0], 0, sizeof(hcl_liw_t) * tmplen[0]); if (CANNOT_KARATSUBA(hcl, ndigits_xl, ndigits_yl)) { multiply_unsigned_array (x, ndigits_xl, y, ndigits_yl, tmp[0]); tmplen[0] = count_effective(tmp[0], tmplen[0]); } else { tmplen[0] = multiply_unsigned_array_karatsuba(hcl, x, ndigits_xl, y, ndigits_yl, tmp[0]); if (tmplen[0] <= 0) goto oops; } /* tmp[1] = a1 * b1 */ tmplen[1] = ndigits_xh + ndigits_yh; HCL_MEMSET (tmp[1], 0, sizeof(hcl_liw_t) * tmplen[1]); if (CANNOT_KARATSUBA(hcl, ndigits_xh, ndigits_yh)) { multiply_unsigned_array (x + nshifts, ndigits_xh, y + nshifts, ndigits_yh, tmp[1]); tmplen[1] = count_effective(tmp[1], tmplen[1]); } else { tmplen[1] = multiply_unsigned_array_karatsuba(hcl, x + nshifts, ndigits_xh, y + nshifts, ndigits_yh, tmp[1]); if (tmplen[1] <= 0) goto oops; } /* (a0+a1)*(b0+b1) -(a0*b0) */ xlen = subtract_unsigned_array(hcl, zsp, xlen, tmp[0], tmplen[0], zsp); /* (a0+a1)*(b0+b1) - (a0*b0) - (a1*b1) */ xlen = subtract_unsigned_array(hcl, zsp, xlen, tmp[1], tmplen[1], zsp); /* a1b1 is in tmp[1]. add (a1b1 * B^2n) to the high part of 'z' */ zsp = z + (nshifts * 2); /* emulate shifting for "* B^2n". */ xlen = zcapa - (nshifts * 2); xlen = add_unsigned_array(zsp, xlen, tmp[1], tmplen[1], zsp); /* z = z + a0b0. a0b0 is in tmp[0] */ xlen = add_unsigned_array(z, zcapa, tmp[0], tmplen[0], z); hcl_freemem (hcl, tmp[1]); hcl_freemem (hcl, tmp[0]); return count_effective (z, xlen); oops: if (tmp[1]) hcl_freemem (hcl, tmp[1]); if (tmp[0]) hcl_freemem (hcl, tmp[0]); return 0; #else hcl_lidw_t nshifts; hcl_lidw_t ndigits_xh, ndigits_xl; hcl_lidw_t ndigits_yh, ndigits_yl; hcl_liw_t* tmp[3] = { HCL_NULL, HCL_NULL, HCL_NULL }; hcl_liw_t* zsp; hcl_oow_t tmplen[3]; hcl_oow_t xlen, zcapa; zcapa = xs + ys; /* the caller ensures this capacity for z at the minimum*/ if (xs < ys) { hcl_oow_t i; /* swap x and y */ i = xs; xs = ys; ys = i; i = (hcl_oow_t)x; x = y; y = (hcl_liw_t*)i; } if (ys == 1) { hcl_lidw_t dw; hcl_liw_t carry = 0; hcl_oow_t i; for (i = 0; i < xs; i++) { dw = ((hcl_lidw_t)x[i] * y[0]) + carry; carry = (hcl_liw_t)(dw >> HCL_LIW_BITS); z[i] = (hcl_liw_t)dw; } z[i] = carry; return; } /* calculate value of nshifts, that is 2^(HCL_LIW_BITS*nshifts) */ nshifts = (xs + 1) / 2; ndigits_xl = nshifts; /* ndigits of lower part of x */ ndigits_xh = xs - nshifts; /* ndigits of upper part of x */ ndigits_yl = nshifts; /* ndigits of lower part of y */ ndigits_yh = ys - nshifts; /* ndigits of uppoer part of y */ HCL_ASSERT (hcl, ndigits_xl >= ndigits_xh); HCL_ASSERT (hcl, ndigits_yl >= ndigits_yh); /* make a temporary buffer for (b0 + b1) and (a1 * b1) */ tmplen[0] = ndigits_yl + ndigits_yh + 1; tmplen[1] = ndigits_xh + ndigits_yh; if (tmplen[1] < tmplen[0]) tmplen[1] = tmplen[0]; tmp[1] = hcl_callocmem(hcl, HCL_SIZEOF(hcl_liw_t) * tmplen[1]); if (!tmp[1]) goto oops; /* make a temporary for (a0 + a1) and (a0 * b0) */ tmplen[0] = ndigits_xl + ndigits_yl; tmp[0] = hcl_callocmem(hcl, HCL_SIZEOF(hcl_liw_t) * tmplen[0]); if (!tmp[0]) goto oops; /* tmp[0] = a0 + a1 */ tmplen[0] = add_unsigned_array(x, ndigits_xl, x + nshifts, ndigits_xh, tmp[0]); /* tmp[1] = b0 + b1 */ tmplen[1] = add_unsigned_array(y, ndigits_yl, y + nshifts, ndigits_yh, tmp[1]); /* tmp[2] = (a0 + a1) * (b0 + b1) */ tmplen[2] = tmplen[0] + tmplen[1]; tmp[2] = hcl_callocmem (hcl, HCL_SIZEOF(hcl_liw_t) * tmplen[2]); if (!tmp[2]) goto oops; if (CANNOT_KARATSUBA(hcl, tmplen[0], tmplen[1])) { multiply_unsigned_array (tmp[0], tmplen[0], tmp[1], tmplen[1], tmp[2]); xlen = count_effective(tmp[2], tmplen[2]); } else { xlen = multiply_unsigned_array_karatsuba(hcl, tmp[0], tmplen[0], tmp[1], tmplen[1], tmp[2]); if (xlen == 0) goto oops; } /* tmp[0] = a0 * b0 */ tmplen[0] = ndigits_xl + ndigits_yl; HCL_MEMSET (tmp[0], 0, sizeof(hcl_liw_t) * tmplen[0]); if (CANNOT_KARATSUBA(hcl, ndigits_xl, ndigits_yl)) { multiply_unsigned_array (x, ndigits_xl, y, ndigits_yl, tmp[0]); tmplen[0] = count_effective(tmp[0], tmplen[0]); } else { tmplen[0] = multiply_unsigned_array_karatsuba(hcl, x, ndigits_xl, y, ndigits_yl, tmp[0]); if (tmplen[0] <= 0) goto oops; } /* tmp[1] = a1 * b1 */ tmplen[1] = ndigits_xh + ndigits_yh; HCL_MEMSET (tmp[1], 0, sizeof(hcl_liw_t) * tmplen[1]); if (CANNOT_KARATSUBA(hcl, ndigits_xh, ndigits_yh)) { multiply_unsigned_array (x + nshifts, ndigits_xh, y + nshifts, ndigits_yh, tmp[1]); tmplen[1] = count_effective(tmp[1], tmplen[1]); } else { tmplen[1] = multiply_unsigned_array_karatsuba(hcl, x + nshifts, ndigits_xh, y + nshifts, ndigits_yh, tmp[1]); if (tmplen[1] <= 0) goto oops; } /* w = w - tmp[0] */ xlen = subtract_unsigned_array(hcl, tmp[2], xlen, tmp[0], tmplen[0], tmp[2]); /* r = w - tmp[1] */ zsp = z + nshifts; /* emulate shifting for "* B^n" */ xlen = subtract_unsigned_array(hcl, tmp[2], xlen, tmp[1], tmplen[1], zsp); /* a1b1 is in tmp[1]. add (a1b1 * B^2n) to the high part of 'z' */ zsp = z + (nshifts * 2); /* emulate shifting for "* B^2n". */ xlen = zcapa - (nshifts * 2); xlen = add_unsigned_array(zsp, xlen, tmp[1], tmplen[1], zsp); /* z = z + a0b0. a0b0 is in tmp[0] */ xlen = add_unsigned_array(z, zcapa, tmp[0], tmplen[0], z); hcl_freemem (hcl, tmp[2]); hcl_freemem (hcl, tmp[1]); hcl_freemem (hcl, tmp[0]); return count_effective(z, xlen); oops: if (tmp[2]) hcl_freemem (hcl, tmp[2]); if (tmp[1]) hcl_freemem (hcl, tmp[1]); if (tmp[0]) hcl_freemem (hcl, tmp[0]); return 0; #endif } static HCL_INLINE void lshift_unsigned_array (hcl_liw_t* x, hcl_oow_t xs, hcl_oow_t bits) { /* this function doesn't grow/shrink the array. Shifting is performed * over the given array */ hcl_oow_t word_shifts, bit_shifts, bit_shifts_right; hcl_oow_t si, di; /* get how many words to shift */ word_shifts = bits / HCL_LIW_BITS; if (word_shifts >= xs) { HCL_MEMSET (x, 0, xs * HCL_SIZEOF(hcl_liw_t)); return; } /* get how many remaining bits to shift */ bit_shifts = bits % HCL_LIW_BITS; bit_shifts_right = HCL_LIW_BITS - bit_shifts; /* shift words and bits */ di = xs - 1; si = di - word_shifts; x[di] = x[si] << bit_shifts; while (di > word_shifts) { x[di] = x[di] | (x[--si] >> bit_shifts_right); x[--di] = x[si] << bit_shifts; } /* fill the remaining part with zeros */ if (word_shifts > 0) HCL_MEMSET (x, 0, word_shifts * HCL_SIZEOF(hcl_liw_t)); } static HCL_INLINE void rshift_unsigned_array (hcl_liw_t* x, hcl_oow_t xs, hcl_oow_t bits) { /* this function doesn't grow/shrink the array. Shifting is performed * over the given array */ hcl_oow_t word_shifts, bit_shifts, bit_shifts_left; hcl_oow_t si, di, bound; /* get how many words to shift */ word_shifts = bits / HCL_LIW_BITS; if (word_shifts >= xs) { HCL_MEMSET (x, 0, xs * HCL_SIZEOF(hcl_liw_t)); return; } /* get how many remaining bits to shift */ bit_shifts = bits % HCL_LIW_BITS; bit_shifts_left = HCL_LIW_BITS - bit_shifts; /* TODO: verify this function */ /* shift words and bits */ di = 0; si = word_shifts; x[di] = x[si] >> bit_shifts; bound = xs - word_shifts - 1; while (di < bound) { x[di] = x[di] | (x[++si] << bit_shifts_left); x[++di] = x[si] >> bit_shifts; } /* fill the remaining part with zeros */ if (word_shifts > 0) HCL_MEMSET (&x[xs - word_shifts], 0, word_shifts * HCL_SIZEOF(hcl_liw_t)); } static void divide_unsigned_array (hcl_t* hcl, const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys, hcl_liw_t* q, hcl_liw_t* r) { /* TODO: this function needs to be rewritten for performance improvement. * the binary long division is extremely slow for a big number */ /* Perform binary long division. * http://en.wikipedia.org/wiki/Division_algorithm * --------------------------------------------------------------------- * Q := 0 initialize quotient and remainder to zero * R := 0 * for i = n-1...0 do where n is number of bits in N * R := R << 1 left-shift R by 1 bit * R(0) := X(i) set the least-significant bit of R equal to bit i of the numerator * if R >= Y then * R = R - Y * Q(i) := 1 * end * end */ hcl_oow_t rs, rrs, i , j; HCL_ASSERT (hcl, xs >= ys); /* the caller must ensure: * - q and r are all zeros. can skip memset() with zero. * - q is as large as xs in size. * - r is as large as ys + 1 in size */ /*HCL_MEMSET (q, 0, HCL_SIZEOF(*q) * xs); HCL_MEMSET (r, 0, HCL_SIZEOF(*q) * ys);*/ rrs = ys + 1; for (i = xs; i > 0; ) { --i; for (j = HCL_LIW_BITS; j > 0;) { --j; /* the value of the remainder 'r' may get bigger than the * divisor 'y' temporarily until subtraction is performed * below. so ys + 1(kept in rrs) is needed for shifting here. */ lshift_unsigned_array (r, rrs, 1); HCL_SETBITS (hcl_liw_t, r[0], 0, 1, HCL_GETBITS(hcl_liw_t, x[i], j, 1)); rs = count_effective(r, rrs); if (!is_less_unsigned_array(r, rs, y, ys)) { subtract_unsigned_array (hcl, r, rs, y, ys, r); HCL_SETBITS (hcl_liw_t, q[i], j, 1, 1); } } } } static HCL_INLINE hcl_liw_t calculate_remainder (hcl_t* hcl, hcl_liw_t* qr, hcl_liw_t* y, hcl_liw_t quo, int qr_start, int stop) { hcl_lidw_t dw; hcl_liw_t b, c, c2, qyk; hcl_oow_t j, k; for (b = 0, c = 0, c2 = 0, j = qr_start, k = 0; k < stop; j++, k++) { dw = (hcl_lidw_t)qr[j] - b; b = (hcl_liw_t)((dw >> HCL_LIW_BITS) & 1); /* b = -(dw mod BASE) */ qr[j] = (hcl_liw_t)dw; dw = ((hcl_lidw_t)y[k] * quo) + c; c = (hcl_liw_t)(dw >> HCL_LIW_BITS); qyk = (hcl_liw_t)dw; dw = (hcl_lidw_t)qr[j] - qyk; c2 = (hcl_liw_t)((dw >> HCL_LIW_BITS) & 1); qr[j] = (hcl_liw_t)dw; dw = (hcl_lidw_t)b + c2 + c; c = (hcl_liw_t)(dw >> HCL_LIW_BITS); b = (hcl_liw_t)dw; HCL_ASSERT (hcl, c == 0); } return b; } static void divide_unsigned_array2 (hcl_t* hcl, const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys, hcl_liw_t* q, hcl_liw_t* r) { hcl_oow_t i; hcl_liw_t d, y1, y2; /* the caller must ensure: * - q can hold 'xs + 1' words and r can hold 'ys' words. * - q and r are set to all zeros. */ HCL_ASSERT (hcl, xs >= ys); if (ys == 1) { /* the divisor has a single word only. perform simple division */ hcl_lidw_t dw; hcl_liw_t carry = 0; for (i = xs; i > 0; ) { --i; dw = ((hcl_lidw_t)carry << HCL_LIW_BITS) + x[i]; q[i] = (hcl_liw_t)(dw / y[0]); carry = (hcl_liw_t)(dw % y[0]); } r[0] = carry; return; } for (i = 0; i < xs; i++) q[i] = x[i]; /* copy x to q */ q[xs] = 0; /* store zero in the last extra word */ for (i = 0; i < ys; i++) r[i] = y[i]; /* copy y to r */ y1 = r[ys - 1]; /* highest divisor word */ /*d = (y1 == HCL_TYPE_MAX(hcl_liw_t)? ((hcl_liw_t)1): ((hcl_liw_t)(((hcl_lidw_t)1 << HCL_LIW_BITS) / (y1 + 1))));*/ d = (hcl_liw_t)(((hcl_lidw_t)1 << HCL_LIW_BITS) / ((hcl_lidw_t)y1 + 1)); if (d > 1) { hcl_lidw_t dw; hcl_liw_t carry; /* shift the divisor such that its high-order bit is on. * shift the dividend the same amount as the previous step */ /* r = r * d */ for (carry = 0, i = 0; i < ys; i++) { dw = ((hcl_lidw_t)r[i] * d) + carry; carry = (hcl_liw_t)(dw >> HCL_LIW_BITS); r[i] = (hcl_liw_t)dw; } HCL_ASSERT (hcl, carry == 0); /* q = q * d */ for (carry = 0, i = 0; i < xs; i++) { dw = ((hcl_lidw_t)q[i] * d) + carry; carry = (hcl_liw_t)(dw >> HCL_LIW_BITS); q[i] = (hcl_liw_t)dw; } q[xs] = carry; } y1 = r[ys - 1]; y2 = r[ys - 2]; for (i = xs; i >= ys; --i) { hcl_lidw_t dw, quo, rem; hcl_liw_t b, xhi, xlo; /* ---------------------------------------------------------- */ /* estimate the quotient. * 2-current-dividend-words / 2-most-significant-divisor-words */ xhi = q[i]; xlo = q[i - 1]; /* adjust the quotient if over-estimated */ dw = ((hcl_lidw_t)xhi << HCL_LIW_BITS) + xlo; /* TODO: optimize it with ASM - no seperate / and % */ quo = dw / y1; rem = dw % y1; adjust_quotient: if (quo > HCL_TYPE_MAX(hcl_liw_t) || (quo * y2) > ((rem << HCL_LIW_BITS) + q[i - 2])) { --quo; rem += y1; if (rem <= HCL_TYPE_MAX(hcl_liw_t)) goto adjust_quotient; } /* ---------------------------------------------------------- */ b = calculate_remainder(hcl, q, r, quo, i - ys, ys); b = (hcl_liw_t)((((hcl_lidw_t)xhi - b) >> HCL_LIW_BITS) & 1); /* is the sign bit set? */ if (b) { /* yes. underflow */ hcl_lidw_t dw; hcl_liw_t carry; hcl_oow_t j, k; for (carry = 0, j = i - ys, k = 0; k < ys; j++, k++) { dw = (hcl_lidw_t)q[j] + r[k] + carry; carry = (hcl_liw_t)(dw >> HCL_LIW_BITS); q[j] = (hcl_liw_t)dw; } HCL_ASSERT (hcl, carry == 1); q[i] = quo - 1; } else { q[i] = quo; } } if (d > 1) { hcl_lidw_t dw; hcl_liw_t carry; for (carry = 0, i = ys; i > 0; ) { --i; dw = ((hcl_lidw_t)carry << HCL_LIW_BITS) + q[i]; /* TODO: optimize it with ASM - no seperate / and % */ q[i] = (hcl_liw_t)(dw / d); carry = (hcl_liw_t)(dw % d); } } /* split quotient and remainder held in q to q and r respectively * q [<--- quotient ---->|<-- remainder -->] * index |xs xs-1 ... ys+1 ys|ys-1 ys-2 ... 1 0| */ for (i = 0; i < ys; i++) { r[i] = q[i]; q[i] = 0; } for (; i <= xs; i++) { q[i - ys] = q[i]; q[i] = 0; } } static void divide_unsigned_array3 (hcl_t* hcl, const hcl_liw_t* x, hcl_oow_t xs, const hcl_liw_t* y, hcl_oow_t ys, hcl_liw_t* q, hcl_liw_t* r) { hcl_oow_t s, i, j, g, k; hcl_lidw_t dw, qhat, rhat; hcl_lidi_t di, ci; hcl_liw_t* qq, y1, y2; /* the caller must ensure: * - q can hold 'xs + 1' words and r can hold 'ys' words. * - q and r are set to all zeros. */ HCL_ASSERT (hcl, xs >= ys); if (ys == 1) { /* the divisor has a single word only. perform simple division */ hcl_lidw_t dw; hcl_liw_t carry = 0; for (i = xs; i > 0; ) { --i; dw = ((hcl_lidw_t)carry << HCL_LIW_BITS) + x[i]; q[i] = (hcl_liw_t)(dw / y[0]); carry = (hcl_liw_t)(dw % y[0]); } r[0] = carry; return; } #define SHARED_QQ #if defined(SHARED_QQ) /* as long as q is 2 words longer than x, this algorithm can store * both quotient and remainder in q at the same time. */ qq = q; #else /* this part requires an extra buffer. proper error handling isn't easy * since the return type of this function is void */ if (hcl->inttostr.t.capa <= xs) { hcl_liw_t* t; hcl_oow_t reqcapa; reqcapa = HCL_ALIGN_POW2(xs + 1, 32); t = (hcl_liw_t*)hcl_reallocmem(hcl, hcl->inttostr.t.ptr, reqcapa * HCL_SIZEOF(*t)); /* TODO: TODO: TODO: ERROR HANDLING if (!t) return -1; */ hcl->inttostr.t.capa = xs + 1; hcl->inttostr.t.ptr = t; } qq = hcl->inttostr.t.ptr; #endif y1 = y[ys - 1]; /*s = HCL_LIW_BITS - ((y1 == 0)? -1: hcl_get_pos_of_msb_set(y1)) - 1;*/ HCL_ASSERT (hcl, y1 > 0); /* the highest word can't be non-zero in the context where this function is called */ s = HCL_LIW_BITS - hcl_get_pos_of_msb_set(y1) - 1; for (i = ys; i > 1; ) { --i; r[i] = (y[i] << s) | ((hcl_lidw_t)y[i - 1] >> (HCL_LIW_BITS - s)); } r[0] = y[0] << s; qq[xs] = (hcl_lidw_t)x[xs - 1] >> (HCL_LIW_BITS - s); for (i = xs; i > 1; ) { --i; qq[i] = (x[i] << s) | ((hcl_lidw_t)x[i - 1] >> (HCL_LIW_BITS - s)); } qq[0] = x[0] << s; y1 = r[ys - 1]; y2 = r[ys - 2]; for (j = xs; j >= ys; --j) { g = j - ys; /* position where remainder begins in qq */ /* estimate */ dw = ((hcl_lidw_t)qq[j] << HCL_LIW_BITS) + qq[j - 1]; qhat = dw / y1; rhat = dw - (qhat * y1); adjust_quotient: if (qhat > HCL_TYPE_MAX(hcl_liw_t) || (qhat * y2) > ((rhat << HCL_LIW_BITS) + qq[j - 2])) { qhat = qhat - 1; rhat = rhat + y1; if (rhat <= HCL_TYPE_MAX(hcl_liw_t)) goto adjust_quotient; } /* multiply and subtract */ for (ci = 0, i = g, k = 0; k < ys; i++, k++) { dw = qhat * r[k]; di = qq[i] - ci - (dw & HCL_TYPE_MAX(hcl_liw_t)); ci = (dw >> HCL_LIW_BITS) - (di >> HCL_LIW_BITS); qq[i] = (hcl_liw_t)di; } HCL_ASSERT (hcl, i == j); di = qq[i] - ci; qq[i] = di; /* test remainder */ if (di < 0) { for (ci = 0, i = g, k = 0; k < ys; i++, k++) { di = (hcl_lidw_t)qq[i] + r[k] + ci; ci = (hcl_liw_t)(di >> HCL_LIW_BITS); qq[i] = (hcl_liw_t)di; } HCL_ASSERT (hcl, i == j); /*HCL_ASSERT (hcl, ci == 1);*/ qq[i] += ci; #if defined(SHARED_QQ) /* store the quotient word right after the remainder in q */ q[i + 1] = qhat - 1; #else q[g] = qhat - 1; #endif } else { #if defined(SHARED_QQ) /* store the quotient word right after the remainder in q */ q[i + 1] = qhat; #else q[g] = qhat; #endif } } for (i = 0; i < ys - 1; i++) { r[i] = (qq[i] >> s) | ((hcl_lidw_t)qq[i + 1] << (HCL_LIW_BITS - s)); } r[i] = qq[i] >> s; #if defined(SHARED_QQ) for (i = 0; i <= ys; i++) { q[i] = 0; } for (; i <= xs + 1; i++) { q[i - ys - 1] = q[i]; q[i] = 0; } #endif } /* ======================================================================== */ static hcl_oop_t add_unsigned_integers (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oow_t as, bs, zs; hcl_oop_t z; as = HCL_OBJ_GET_SIZE(x); bs = HCL_OBJ_GET_SIZE(y); zs = (as >= bs? as: bs); if (zs >= HCL_OBJ_SIZE_MAX) { hcl_seterrnum (hcl, HCL_EOOMEM); /* TOOD: is it a soft failure or hard failure? */ return HCL_NULL; } zs++; hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); z = hcl_makebigint(hcl, HCL_OBJ_GET_FLAGS_BRAND(x), HCL_NULL, zs); hcl_popvolats (hcl, 2); if (!z) return HCL_NULL; add_unsigned_array ( ((hcl_oop_liword_t)x)->slot, as, ((hcl_oop_liword_t)y)->slot, bs, ((hcl_oop_liword_t)z)->slot ); return z; } static hcl_oop_t subtract_unsigned_integers (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; HCL_ASSERT (hcl, !is_less_unsigned(x, y)); hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, HCL_OBJ_GET_SIZE(x)); hcl_popvolats (hcl, 2); if (!z) return HCL_NULL; subtract_unsigned_array (hcl, ((hcl_oop_liword_t)x)->slot, HCL_OBJ_GET_SIZE(x), ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(y), ((hcl_oop_liword_t)z)->slot); return z; } static hcl_oop_t multiply_unsigned_integers (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; hcl_oow_t xs, ys; xs = HCL_OBJ_GET_SIZE(x); ys = HCL_OBJ_GET_SIZE(y); if (ys > HCL_OBJ_SIZE_MAX - xs) { hcl_seterrnum (hcl, HCL_EOOMEM); /* TOOD: is it a soft failure or hard failure? */ return HCL_NULL; } hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, xs + ys); hcl_popvolats (hcl, 2); if (!z) return HCL_NULL; #if defined(HCL_ENABLE_KARATSUBA) if (CANNOT_KARATSUBA(hcl, xs, ys)) { #endif multiply_unsigned_array ( ((hcl_oop_liword_t)x)->slot, HCL_OBJ_GET_SIZE(x), ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(y), ((hcl_oop_liword_t)z)->slot); #if defined(HCL_ENABLE_KARATSUBA) } else { if (multiply_unsigned_array_karatsuba ( hcl, ((hcl_oop_liword_t)x)->slot, HCL_OBJ_GET_SIZE(x), ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(y), ((hcl_oop_liword_t)z)->slot) == 0) return HCL_NULL; } #endif return z; } static hcl_oop_t divide_unsigned_integers (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y, hcl_oop_t* r) { hcl_oop_t qq, rr; if (is_less_unsigned(x, y)) { rr = clone_bigint(hcl, x, HCL_OBJ_GET_SIZE(x)); if (!rr) return HCL_NULL; hcl_pushvolat (hcl, &rr); qq = make_bigint_with_ooi(hcl, 0); /* TODO: inefficient. no need to create a bigint object for zero. */ hcl_popvolat (hcl); if (qq) *r = rr; return qq; } else if (is_equal_unsigned(x, y)) { rr = make_bigint_with_ooi(hcl, 0); /* TODO: inefficient. no need to create a bigint object for zero. */ if (!rr) return HCL_NULL; hcl_pushvolat (hcl, &rr); qq = make_bigint_with_ooi(hcl, 1); /* TODO: inefficient. no need to create a bigint object for zero. */ hcl_popvolat (hcl); if (qq) *r = rr; return qq; } /* the caller must ensure that x >= y */ HCL_ASSERT (hcl, !is_less_unsigned(x, y)); hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); #define USE_DIVIDE_UNSIGNED_ARRAY2 /*#define USE_DIVIDE_UNSIGNED_ARRAY3*/ #if defined(USE_DIVIDE_UNSIGNED_ARRAY3) qq = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, HCL_OBJ_GET_SIZE(x) + 2); #elif defined(USE_DIVIDE_UNSIGNED_ARRAY2) qq = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, HCL_OBJ_GET_SIZE(x) + 1); #else qq = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, HCL_OBJ_GET_SIZE(x)); #endif if (!qq) { hcl_popvolats (hcl, 2); return HCL_NULL; } hcl_pushvolat (hcl, &qq); #if defined(USE_DIVIDE_UNSIGNED_ARRAY3) rr = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, HCL_OBJ_GET_SIZE(y)); #elif defined(USE_DIVIDE_UNSIGNED_ARRAY2) rr = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, HCL_OBJ_GET_SIZE(y)); #else rr = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, HCL_OBJ_GET_SIZE(y) + 1); #endif hcl_popvolats (hcl, 3); if (!rr) return HCL_NULL; #if defined(USE_DIVIDE_UNSIGNED_ARRAY3) divide_unsigned_array3 (hcl, #elif defined(USE_DIVIDE_UNSIGNED_ARRAY2) divide_unsigned_array2 (hcl, #else divide_unsigned_array (hcl, #endif ((hcl_oop_liword_t)x)->slot, HCL_OBJ_GET_SIZE(x), ((hcl_oop_liword_t)y)->slot, HCL_OBJ_GET_SIZE(y), ((hcl_oop_liword_t)qq)->slot, ((hcl_oop_liword_t)rr)->slot); *r = rr; return qq; } /* ======================================================================== */ hcl_oop_t hcl_addints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t i; /* no integer overflow/underflow must occur as the possible integer * range is narrowed by the tag bits used */ HCL_ASSERT (hcl, HCL_SMOOI_MAX + HCL_SMOOI_MAX < HCL_TYPE_MAX(hcl_ooi_t)); HCL_ASSERT (hcl, HCL_SMOOI_MIN + HCL_SMOOI_MIN > HCL_TYPE_MIN(hcl_ooi_t)); i = HCL_OOP_TO_SMOOI(x) + HCL_OOP_TO_SMOOI(y); if (HCL_IN_SMOOI_RANGE(i)) return HCL_SMOOI_TO_OOP(i); return make_bigint_with_ooi (hcl, i); } else { hcl_ooi_t v; if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl,y)) goto oops_einval; v = HCL_OOP_TO_SMOOI(x); if (v == 0) return clone_bigint (hcl, y, HCL_OBJ_GET_SIZE(y)); hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; } else if (HCL_OOP_IS_SMOOI(y)) { if (!hcl_isbigint(hcl,x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); if (v == 0) return clone_bigint (hcl, x, HCL_OBJ_GET_SIZE(x)); hcl_pushvolat (hcl, &x); y = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!y) return HCL_NULL; } else { if (!hcl_isbigint(hcl,x)) goto oops_einval; if (!hcl_isbigint(hcl,y)) goto oops_einval; } if (HCL_OBJ_GET_FLAGS_BRAND(x) != HCL_OBJ_GET_FLAGS_BRAND(y)) { if (HCL_IS_NBIGINT(hcl, x)) { /* x is negative, y is positive */ if (is_less_unsigned (x, y)) { z = subtract_unsigned_integers (hcl, y, x); if (!z) return HCL_NULL; } else { z = subtract_unsigned_integers (hcl, x, y); if (!z) return HCL_NULL; HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } } else { /* x is positive, y is negative */ if (is_less_unsigned (x, y)) { z = subtract_unsigned_integers (hcl, y, x); if (!z) return HCL_NULL; HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } else { z = subtract_unsigned_integers (hcl, x, y); if (!z) return HCL_NULL; } } } else { int neg; /* both are positive or negative */ neg = HCL_IS_NBIGINT(hcl, x); z = add_unsigned_integers (hcl, x, y); if (!z) return HCL_NULL; if (neg) HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } } return normalize_bigint (hcl, z); oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_subints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t i; /* no integer overflow/underflow must occur as the possible integer * range is narrowed by the tag bits used */ HCL_ASSERT (hcl, HCL_SMOOI_MAX - HCL_SMOOI_MIN < HCL_TYPE_MAX(hcl_ooi_t)); HCL_ASSERT (hcl, HCL_SMOOI_MIN - HCL_SMOOI_MAX > HCL_TYPE_MIN(hcl_ooi_t)); i = HCL_OOP_TO_SMOOI(x) - HCL_OOP_TO_SMOOI(y); if (HCL_IN_SMOOI_RANGE(i)) return HCL_SMOOI_TO_OOP(i); return make_bigint_with_ooi (hcl, i); } else { hcl_ooi_t v; int neg; if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl,y)) goto oops_einval; v = HCL_OOP_TO_SMOOI(x); if (v == 0) { /* switch the sign to the opposite and return it */ return clone_bigint_negated (hcl, y, HCL_OBJ_GET_SIZE(y)); } hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; } else if (HCL_OOP_IS_SMOOI(y)) { if (!hcl_isbigint(hcl,x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); if (v == 0) return clone_bigint (hcl, x, HCL_OBJ_GET_SIZE(x)); hcl_pushvolat (hcl, &x); y = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!y) return HCL_NULL; } else { if (!hcl_isbigint(hcl,x)) goto oops_einval; if (!hcl_isbigint(hcl,y)) goto oops_einval; } if (HCL_OBJ_GET_FLAGS_BRAND(x) != HCL_OBJ_GET_FLAGS_BRAND(y)) { neg = HCL_IS_NBIGINT(hcl, x); z = add_unsigned_integers (hcl, x, y); if (!z) return HCL_NULL; if (neg) HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } else { /* both are positive or negative */ if (is_less_unsigned (x, y)) { neg = HCL_IS_NBIGINT(hcl, x); z = subtract_unsigned_integers (hcl, y, x); if (!z) return HCL_NULL; if (!neg) HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } else { neg = HCL_IS_NBIGINT(hcl, x); z = subtract_unsigned_integers (hcl, x, y); /* take x's sign */ if (!z) return HCL_NULL; if (neg) HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } } } return normalize_bigint (hcl, z); oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_mulints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { #if (HCL_SIZEOF_INTMAX_T > HCL_SIZEOF_OOI_T) hcl_intmax_t i; i = (hcl_intmax_t)HCL_OOP_TO_SMOOI(x) * (hcl_intmax_t)HCL_OOP_TO_SMOOI(y); if (HCL_IN_SMOOI_RANGE(i)) return HCL_SMOOI_TO_OOP((hcl_ooi_t)i); return make_bigint_with_intmax (hcl, i); #else hcl_ooi_t i; hcl_ooi_t xv, yv; xv = HCL_OOP_TO_SMOOI(x); yv = HCL_OOP_TO_SMOOI(y); if (shcli_mul_overflow (hcl, xv, yv, &i)) { /* overflowed - convert x and y normal objects and carry on */ /* no need to call hcl_pushvolat before creating x because * xv and yv contains actual values needed */ x = make_bigint_with_ooi (hcl, xv); if (!x) return HCL_NULL; hcl_pushvolat (hcl, &x); /* protect x made above */ y = make_bigint_with_ooi (hcl, yv); hcl_popvolat (hcl); if (!y) return HCL_NULL; goto full_multiply; } else { if (HCL_IN_SMOOI_RANGE(i)) return HCL_SMOOI_TO_OOP(i); return make_bigint_with_ooi (hcl, i); } #endif } else { hcl_ooi_t v; int neg; if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl,y)) goto oops_einval; v = HCL_OOP_TO_SMOOI(x); switch (v) { case 0: return HCL_SMOOI_TO_OOP(0); case 1: return clone_bigint (hcl, y, HCL_OBJ_GET_SIZE(y)); case -1: return clone_bigint_negated (hcl, y, HCL_OBJ_GET_SIZE(y)); } hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; } else if (HCL_OOP_IS_SMOOI(y)) { if (!hcl_isbigint(hcl,x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); switch (v) { case 0: return HCL_SMOOI_TO_OOP(0); case 1: return clone_bigint (hcl, x, HCL_OBJ_GET_SIZE(x)); case -1: return clone_bigint_negated (hcl, x, HCL_OBJ_GET_SIZE(x)); } hcl_pushvolat (hcl, &x); y = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!y) return HCL_NULL; } else { if (!hcl_isbigint(hcl,x)) goto oops_einval; if (!hcl_isbigint(hcl,y)) goto oops_einval; } full_multiply: neg = (HCL_OBJ_GET_FLAGS_BRAND(x) != HCL_OBJ_GET_FLAGS_BRAND(y)); z = multiply_unsigned_integers (hcl, x, y); if (!z) return HCL_NULL; if (neg) HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } return normalize_bigint (hcl, z); oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_divints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y, int modulo, hcl_oop_t* rem) { hcl_oop_t z, r; int x_neg_sign, y_neg_sign; if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t xv, yv, q, ri; xv = HCL_OOP_TO_SMOOI(x); yv = HCL_OOP_TO_SMOOI(y); if (yv == 0) { hcl_seterrnum (hcl, HCL_EDIVBY0); return HCL_NULL; } if (xv == 0) { if (rem) *rem = HCL_SMOOI_TO_OOP(0); return HCL_SMOOI_TO_OOP(0); } /* In C89, integer division with a negative number is * implementation dependent. In C99, it truncates towards zero. * * http://python-history.blogspot.kr/2010/08/why-pythons-integer-division-floors.html * The integer division operation (//) and its sibling, * the modulo operation (%), go together and satisfy a nice * mathematical relationship (all variables are integers): * a/b = q with remainder r * such that * b*q + r = a and 0 <= r < b (assuming- a and b are >= 0). * * If you want the relationship to extend for negative a * (keeping b positive), you have two choices: if you truncate q * towards zero, r will become negative, so that the invariant * changes to 0 <= abs(r) < abs(b). otherwise, you can floor q * towards negative infinity, and the invariant remains 0 <= r < b. */ q = xv / yv; HCL_ASSERT (hcl, HCL_IN_SMOOI_RANGE(q)); ri = xv - yv * q; /* xv % yv; */ if (ri) { if (modulo) { /* modulo */ /* xv yv q r ------------------------- 7 3 2 1 -7 3 -3 2 7 -3 -3 -2 -7 -3 2 -1 */ /* r must be floored. that is, it rounds away from zero * and towards negative infinity */ if (IS_SIGN_DIFF(yv, ri)) { /* if the divisor has a different sign from r, * change the sign of r to the divisor's sign */ ri += yv; --q; HCL_ASSERT (hcl, ri && !IS_SIGN_DIFF(yv, ri)); } } else { /* remainder */ /* xv yv q r ------------------------- 7 3 2 1 -7 3 -2 -1 7 -3 -2 1 -7 -3 2 -1 */ if (xv && IS_SIGN_DIFF(xv, ri)) { /* if the dividend has a different sign from r, * change the sign of r to the dividend's sign. * all the compilers i've worked with produced * the quotient and the remainder that don't need * any adjustment. however, there may be an esoteric * architecture. */ ri -= yv; ++q; HCL_ASSERT (hcl, xv && !IS_SIGN_DIFF(xv, ri)); } } } if (rem) { HCL_ASSERT (hcl, HCL_IN_SMOOI_RANGE(ri)); *rem = HCL_SMOOI_TO_OOP(ri); } return HCL_SMOOI_TO_OOP((hcl_ooi_t)q); } else { if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t xv; if (!hcl_isbigint(hcl,y)) goto oops_einval; /* divide a small integer by a big integer. * the dividend is guaranteed to be greater than the divisor * if both are positive. */ xv = HCL_OOP_TO_SMOOI(x); x_neg_sign = (xv < 0); y_neg_sign = HCL_IS_NBIGINT(hcl, y); if (x_neg_sign == y_neg_sign || !modulo) { /* simple. the quotient is zero and the * dividend becomes the remainder as a whole. */ if (rem) *rem = x; return HCL_SMOOI_TO_OOP(0); } /* carry on to the full bigint division */ hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi(hcl, xv); hcl_popvolat (hcl); if (!x) return HCL_NULL; } else if (HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t yv; if (!hcl_isbigint(hcl,x)) goto oops_einval; /* divide a big integer by a small integer. */ yv = HCL_OOP_TO_SMOOI(y); switch (yv) { case 0: hcl_seterrnum (hcl, HCL_EDIVBY0); return HCL_NULL; case 1: z = clone_bigint(hcl, x, HCL_OBJ_GET_SIZE(x)); if (!z) return HCL_NULL; if (rem) *rem = HCL_SMOOI_TO_OOP(0); return z; case -1: z = clone_bigint_negated(hcl, x, HCL_OBJ_GET_SIZE(x)); if (!z) return HCL_NULL; if (rem) *rem = HCL_SMOOI_TO_OOP(0); return z; default: { hcl_lidw_t dw; hcl_liw_t carry = 0; hcl_liw_t* zw; hcl_oow_t zs, i; hcl_ooi_t yv_abs, ri; yv_abs = (yv < 0)? -yv: yv; #if (HCL_LIW_BITS < HCL_OOI_BITS) if (yv_abs > HCL_TYPE_MAX(hcl_liw_t)) break; #endif x_neg_sign = (HCL_IS_NBIGINT(hcl, x)); y_neg_sign = (yv < 0); z = clone_bigint_to_positive(hcl, x, HCL_OBJ_GET_SIZE(x)); if (!z) return HCL_NULL; zw = ((hcl_oop_liword_t)z)->slot; zs = HCL_OBJ_GET_SIZE(z); for (i = zs; i > 0; ) { --i; dw = ((hcl_lidw_t)carry << HCL_LIW_BITS) + zw[i]; /* TODO: optimize it with ASM - no seperate / and % */ zw[i] = (hcl_liw_t)(dw / yv_abs); carry = (hcl_liw_t)(dw % yv_abs); } /*if (zw[zs - 1] == 0) zs--;*/ HCL_ASSERT (hcl, carry <= HCL_SMOOI_MAX); ri = carry; if (x_neg_sign) ri = -ri; z = normalize_bigint(hcl, z); if (!z) return HCL_NULL; if (x_neg_sign != y_neg_sign) { HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); if (ri && modulo) { z = hcl_subints(hcl, z, HCL_SMOOI_TO_OOP(1)); if (!z) return HCL_NULL; if (rem) { hcl_pushvolat (hcl, &z); r = hcl_addints(hcl, HCL_SMOOI_TO_OOP(ri), HCL_SMOOI_TO_OOP(yv)); hcl_popvolat (hcl); if (!r) return HCL_NULL; *rem = r; } return z; } } if (rem) *rem = HCL_SMOOI_TO_OOP(ri); return z; } } /* carry on to the full bigint division */ hcl_pushvolat (hcl, &x); y = make_bigint_with_ooi (hcl, yv); hcl_popvolat (hcl); if (!y) return HCL_NULL; } else { if (!hcl_isbigint(hcl,x)) goto oops_einval; if (!hcl_isbigint(hcl,y)) goto oops_einval; } } x_neg_sign = HCL_IS_NBIGINT(hcl, x); y_neg_sign = HCL_IS_NBIGINT(hcl, y); hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); z = divide_unsigned_integers (hcl, x, y, &r); hcl_popvolats (hcl, 2); if (!z) return HCL_NULL; if (x_neg_sign) { /* the class on r must be set before normalize_bigint() * because it can get changed to a small integer */ HCL_OBJ_SET_FLAGS_BRAND (r, HCL_BRAND_NBIGINT); } if (x_neg_sign != y_neg_sign) { HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); hcl_pushvolat (hcl, &z); hcl_pushvolat (hcl, &y); r = normalize_bigint (hcl, r); hcl_popvolats (hcl, 2); if (!r) return HCL_NULL; if (r != HCL_SMOOI_TO_OOP(0) && modulo) { if (rem) { hcl_pushvolat (hcl, &z); hcl_pushvolat (hcl, &y); r = hcl_addints (hcl, r, y); hcl_popvolats (hcl, 2); if (!r) return HCL_NULL; hcl_pushvolat (hcl, &r); z = normalize_bigint (hcl, z); hcl_popvolat (hcl); if (!z) return HCL_NULL; hcl_pushvolat (hcl, &r); z = hcl_subints (hcl, z, HCL_SMOOI_TO_OOP(1)); hcl_popvolat (hcl); if (!z) return HCL_NULL; *rem = r; return z; } else { /* remainder is not needed at all */ /* TODO: subtract 1 without normalization??? */ z = normalize_bigint (hcl, z); if (!z) return HCL_NULL; return hcl_subints (hcl, z, HCL_SMOOI_TO_OOP(1)); } } } else { hcl_pushvolat (hcl, &z); r = normalize_bigint (hcl, r); hcl_popvolat (hcl); if (!r) return HCL_NULL; } hcl_pushvolat (hcl, &r); z = normalize_bigint(hcl, z); hcl_popvolat (hcl); if (z && rem) *rem = r; return z; oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_negateint (hcl_t* hcl, hcl_oop_t x) { if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); return HCL_SMOOI_TO_OOP(-v); } else { if (!hcl_isbigint(hcl, x)) goto oops_einval; return clone_bigint_negated (hcl, x, HCL_OBJ_GET_SIZE(x)); } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O", x); return HCL_NULL; } hcl_oop_t hcl_bitatint (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { /* y is 0-based */ if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v1, v2, v3; v1 = HCL_OOP_TO_SMOOI(x); v2 = HCL_OOP_TO_SMOOI(y); if (v2 < 0) return HCL_SMOOI_TO_OOP(0); if (v1 >= 0) { /* the absolute value may be composed of up to * HCL_SMOOI_BITS - 1 bits as there is a sign bit.*/ if (v2 >= HCL_SMOOI_BITS - 1) return HCL_SMOOI_TO_OOP(0); v3 = ((hcl_oow_t)v1 >> v2) & 1; } else { if (v2 >= HCL_SMOOI_BITS - 1) return HCL_SMOOI_TO_OOP(1); v3 = ((~(hcl_oow_t)-v1 + 1) >> v2) & 1; } return HCL_SMOOI_TO_OOP(v3); } else if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl, y)) goto oops_einval; if (HCL_IS_NBIGINT(hcl, y)) return HCL_SMOOI_TO_OOP(0); /* y is definitely >= HCL_SMOOI_BITS */ if (HCL_OOP_TO_SMOOI(x) >= 0) return HCL_SMOOI_TO_OOP(0); else return HCL_SMOOI_TO_OOP(1); } else if (HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v; hcl_oow_t wp, bp, xs; if (!hcl_isbigint(hcl, x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); if (v < 0) return HCL_SMOOI_TO_OOP(0); wp = v / HCL_LIW_BITS; bp = v - (wp * HCL_LIW_BITS); xs = HCL_OBJ_GET_SIZE(x); if (HCL_IS_PBIGINT(hcl, x)) { if (wp >= xs) return HCL_SMOOI_TO_OOP(0); v = (((hcl_oop_liword_t)x)->slot[wp] >> bp) & 1; } else { hcl_lidw_t w, carry; hcl_oow_t i; if (wp >= xs) return HCL_SMOOI_TO_OOP(1); carry = 1; for (i = 0; i <= wp; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; } v = ((hcl_oow_t)w >> bp) & 1; } return HCL_SMOOI_TO_OOP(v); } else { #if defined(HCL_LIMIT_OBJ_SIZE) /* nothing */ #else hcl_oow_t w, wp, bp, xs; hcl_ooi_t v; int sign; #endif if (!hcl_isbigint(hcl, x) || !hcl_isbigint(hcl, y)) goto oops_einval; #if defined(HCL_LIMIT_OBJ_SIZE) if (HCL_IS_NBIGINT(hcl, y)) return HCL_SMOOI_TO_OOP(0); HCL_ASSERT (hcl, HCL_OBJ_SIZE_BITS_MAX <= HCL_TYPE_MAX(hcl_oow_t)); if (HCL_IS_PBIGINT(hcl, x)) { return HCL_SMOOI_TO_OOP(0); } else { return HCL_SMOOI_TO_OOP(1); } #else xs = HCL_OBJ_GET_SIZE(x); if (HCL_IS_NBIGINT(hcl, y)) return HCL_SMOOI_TO_OOP(0); sign = bigint_to_oow_noseterr(hcl, y, &w); HCL_ASSERT (hcl, sign >= 0); if (sign >= 1) { wp = w / HCL_LIW_BITS; bp = w - (wp * HCL_LIW_BITS); } else { hcl_oop_t quo, rem; HCL_ASSERT (hcl, sign == 0); hcl_pushvolat (hcl, &x); quo = hcl_divints(hcl, y, HCL_SMOOI_TO_OOP(HCL_LIW_BITS), 0, &rem); hcl_popvolat (hcl); if (!quo) return HCL_NULL; sign = integer_to_oow_noseterr(hcl, quo, &wp); HCL_ASSERT (hcl, sign >= 0); if (sign == 0) { /* too large. set it to xs so that it gets out of * the valid range */ wp = xs; } HCL_ASSERT (hcl, HCL_OOP_IS_SMOOI(rem)); bp = HCL_OOP_TO_SMOOI(rem); HCL_ASSERT (hcl, bp >= 0 && bp < HCL_LIW_BITS); } if (HCL_IS_PBIGINT(hcl, x)) { if (wp >= xs) return HCL_SMOOI_TO_OOP(0); v = (((hcl_oop_liword_t)x)->slot[wp] >> bp) & 1; } else { hcl_lidw_t w, carry; hcl_oow_t i; if (wp >= xs) return HCL_SMOOI_TO_OOP(1); carry = 1; for (i = 0; i <= wp; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; } v = ((hcl_oow_t)w >> bp) & 1; } return HCL_SMOOI_TO_OOP(v); #endif } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_bitandints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v1, v2, v3; v1 = HCL_OOP_TO_SMOOI(x); v2 = HCL_OOP_TO_SMOOI(y); v3 = v1 & v2; if (HCL_IN_SMOOI_RANGE(v3)) return HCL_SMOOI_TO_OOP(v3); return make_bigint_with_ooi (hcl, v3); } else if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; if (!hcl_isbigint(hcl, y)) goto oops_einval; v = HCL_OOP_TO_SMOOI(x); if (v == 0) return HCL_SMOOI_TO_OOP(0); hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; goto bigint_and_bigint; } else if (HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v; if (!hcl_isbigint(hcl, x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); if (v == 0) return HCL_SMOOI_TO_OOP(0); hcl_pushvolat (hcl, &x); y = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; goto bigint_and_bigint; } else { hcl_oop_t z; hcl_oow_t i, xs, ys, zs, zalloc; int negx, negy; if (!hcl_isbigint(hcl,x) || !hcl_isbigint(hcl, y)) goto oops_einval; bigint_and_bigint: xs = HCL_OBJ_GET_SIZE(x); ys = HCL_OBJ_GET_SIZE(y); if (xs < ys) { /* make sure that x is greater than or equal to y */ z = x; x = y; y = z; zs = ys; ys = xs; xs = zs; } negx = HCL_IS_NBIGINT(hcl, x); negy = HCL_IS_NBIGINT(hcl, y); if (negx && negy) { zalloc = xs + 1; zs = xs; } else if (negx) { zalloc = ys; zs = ys; } else if (negy) { zalloc = xs; zs = xs; } else { zalloc = ys; zs = ys; } hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, zalloc); hcl_popvolats (hcl, 2); if (!z) return HCL_NULL; if (negx && negy) { /* both are negative */ hcl_lidw_t w[2]; hcl_lidw_t carry[2]; carry[0] = 1; carry[1] = 1; /* 2's complement on both x and y and perform bitwise-and */ for (i = 0; i < ys; i++) { w[0] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry[0]; carry[0] = w[0] >> HCL_LIW_BITS; w[1] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)y)->slot[i]) + carry[1]; carry[1] = w[1] >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w[0] & (hcl_liw_t)w[1]; } HCL_ASSERT (hcl, carry[1] == 0); /* 2's complement on the remaining part of x. the lacking part * in y is treated as if they are all 1s. */ for (; i < xs; i++) { w[0] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry[0]; carry[0] = w[0] >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w[0]; } HCL_ASSERT (hcl, carry[0] == 0); /* 2's complement on the final result */ ((hcl_oop_liword_t)z)->slot[zs] = ~(hcl_liw_t)0; carry[0] = 1; for (i = 0; i <= zs; i++) { w[0] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)z)->slot[i]) + carry[0]; carry[0] = w[0] >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w[0]; } HCL_ASSERT (hcl, carry[0] == 0); HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } else if (negx) { /* x is negative, y is positive */ hcl_lidw_t w, carry; carry = 1; for (i = 0; i < ys; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w & ((hcl_oop_liword_t)y)->slot[i]; } /* the lacking part in y is all 0's. the remaining part in x is * just masked out when bitwise-anded with 0. so nothing is done * to handle the remaining part in x */ } else if (negy) { /* x is positive, y is negative */ hcl_lidw_t w, carry; /* x & 2's complement on y up to ys */ carry = 1; for (i = 0; i < ys; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)y)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i] & (hcl_liw_t)w; } HCL_ASSERT (hcl, carry == 0); /* handle the longer part in x than y * * For example, * x => + 1010 1100 * y => - 0011 * * If y is extended to the same length as x, * it is a negative 0000 0001. * 2's complement is performed on this imaginary extension. * the result is '1111 1101' (1111 1100 + 1). * * when y is shorter and negative, the lacking part can be * treated as all 1s in the 2's complement format. * * the remaining part in x can be just copied to the * final result 'z'. */ for (; i < xs; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i]; } } else { /* both are positive */ for (i = 0; i < ys; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i] & ((hcl_oop_liword_t)y)->slot[i]; } } return normalize_bigint(hcl, z); } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_bitorints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v1, v2, v3; v1 = HCL_OOP_TO_SMOOI(x); v2 = HCL_OOP_TO_SMOOI(y); v3 = v1 | v2; if (HCL_IN_SMOOI_RANGE(v3)) return HCL_SMOOI_TO_OOP(v3); return make_bigint_with_ooi (hcl, v3); } else if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; if (!hcl_isbigint(hcl, y)) goto oops_einval; v = HCL_OOP_TO_SMOOI(x); if (v == 0) return clone_bigint(hcl, y, HCL_OBJ_GET_SIZE(y)); hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; goto bigint_and_bigint; } else if (HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v; if (!hcl_isbigint(hcl, x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); if (v == 0) return clone_bigint(hcl, x, HCL_OBJ_GET_SIZE(x)); hcl_pushvolat (hcl, &x); y = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; goto bigint_and_bigint; } else { hcl_oop_t z; hcl_oow_t i, xs, ys, zs, zalloc; int negx, negy; if (!hcl_isbigint(hcl,x) || !hcl_isbigint(hcl, y)) goto oops_einval; bigint_and_bigint: xs = HCL_OBJ_GET_SIZE(x); ys = HCL_OBJ_GET_SIZE(y); if (xs < ys) { /* make sure that x is greater than or equal to y */ z = x; x = y; y = z; zs = ys; ys = xs; xs = zs; } negx = HCL_IS_NBIGINT(hcl, x); negy = HCL_IS_NBIGINT(hcl, y); if (negx && negy) { zalloc = ys + 1; zs = ys; } else if (negx) { zalloc = xs + 1; zs = xs; } else if (negy) { zalloc = ys + 1; zs = ys; } else { zalloc = xs; zs = xs; } if (zalloc < zs) { /* overflow in zalloc calculation above */ hcl_seterrnum (hcl, HCL_EOOMEM); /* TODO: is it a soft failure or hard failure? */ return HCL_NULL; } hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, zalloc); hcl_popvolats (hcl, 2); if (!z) return HCL_NULL; if (negx && negy) { /* both are negative */ hcl_lidw_t w[2]; hcl_lidw_t carry[2]; carry[0] = 1; carry[1] = 1; /* 2's complement on both x and y and perform bitwise-and */ for (i = 0; i < ys; i++) { w[0] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry[0]; carry[0] = w[0] >> HCL_LIW_BITS; w[1] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)y)->slot[i]) + carry[1]; carry[1] = w[1] >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w[0] | (hcl_liw_t)w[1]; } HCL_ASSERT (hcl, carry[1] == 0); /* do nothing about the extra part in x and the lacking part * in y for the reason shown in [NOTE] in the 'else if' block * further down. */ adjust_to_negative: /* 2's complement on the final result */ ((hcl_oop_liword_t)z)->slot[zs] = ~(hcl_liw_t)0; carry[0] = 1; for (i = 0; i <= zs; i++) { w[0] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)z)->slot[i]) + carry[0]; carry[0] = w[0] >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w[0]; } HCL_ASSERT (hcl, carry[0] == 0); HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } else if (negx) { /* x is negative, y is positive */ hcl_lidw_t w, carry; carry = 1; for (i = 0; i < ys; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w | ((hcl_oop_liword_t)y)->slot[i]; } for (; i < xs; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w; } HCL_ASSERT (hcl, carry == 0); goto adjust_to_negative; } else if (negy) { /* x is positive, y is negative */ hcl_lidw_t w, carry; /* x & 2's complement on y up to ys */ carry = 1; for (i = 0; i < ys; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)y)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i] | (hcl_liw_t)w; } HCL_ASSERT (hcl, carry == 0); /* [NOTE] * in theory, the lacking part in ys is all 1s when y is * extended to the width of x. but those 1s are inverted to * 0s when another 2's complement is performed over the final * result after the jump to 'adjust_to_negative'. * setting zs to 'xs + 1' and performing the following loop is * redundant. for (; i < xs; i++) { ((hcl_oop_liword_t)z)->slot[i] = ~(hcl_liw_t)0; } */ goto adjust_to_negative; } else { /* both are positive */ for (i = 0; i < ys; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i] | ((hcl_oop_liword_t)y)->slot[i]; } for (; i < xs; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i]; } } return normalize_bigint(hcl, z); } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_bitxorints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v1, v2, v3; v1 = HCL_OOP_TO_SMOOI(x); v2 = HCL_OOP_TO_SMOOI(y); v3 = v1 ^ v2; if (HCL_IN_SMOOI_RANGE(v3)) return HCL_SMOOI_TO_OOP(v3); return make_bigint_with_ooi (hcl, v3); } else if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; if (!hcl_isbigint(hcl, y)) goto oops_einval; v = HCL_OOP_TO_SMOOI(x); if (v == 0) return clone_bigint(hcl, y, HCL_OBJ_GET_SIZE(y)); hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; goto bigint_and_bigint; } else if (HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v; if (!hcl_isbigint(hcl, x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); if (v == 0) return clone_bigint(hcl, x, HCL_OBJ_GET_SIZE(x)); hcl_pushvolat (hcl, &x); y = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; goto bigint_and_bigint; } else { hcl_oop_t z; hcl_oow_t i, xs, ys, zs, zalloc; int negx, negy; if (!hcl_isbigint(hcl,x) || !hcl_isbigint(hcl, y)) goto oops_einval; bigint_and_bigint: xs = HCL_OBJ_GET_SIZE(x); ys = HCL_OBJ_GET_SIZE(y); if (xs < ys) { /* make sure that x is greater than or equal to y */ z = x; x = y; y = z; zs = ys; ys = xs; xs = zs; } negx = HCL_IS_NBIGINT(hcl, x); negy = HCL_IS_NBIGINT(hcl, y); if (negx && negy) { zalloc = xs; zs = xs; } else if (negx) { zalloc = xs + 1; zs = xs; } else if (negy) { zalloc = xs + 1; zs = xs; } else { zalloc = xs; zs = xs; } if (zalloc < zs) { /* overflow in zalloc calculation above */ hcl_seterrnum (hcl, HCL_EOOMEM); /* TODO: is it a soft failure or hard failure? */ return HCL_NULL; } hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &y); z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, zalloc); hcl_popvolats (hcl, 2); if (!z) return HCL_NULL; if (negx && negy) { /* both are negative */ hcl_lidw_t w[2]; hcl_lidw_t carry[2]; carry[0] = 1; carry[1] = 1; /* 2's complement on both x and y and perform bitwise-and */ for (i = 0; i < ys; i++) { w[0] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry[0]; carry[0] = w[0] >> HCL_LIW_BITS; w[1] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)y)->slot[i]) + carry[1]; carry[1] = w[1] >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w[0] ^ (hcl_liw_t)w[1]; } HCL_ASSERT (hcl, carry[1] == 0); /* treat the lacking part in y as all 1s */ for (; i < xs; i++) { w[0] = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry[0]; carry[0] = w[0] >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w[0] ^ (~(hcl_liw_t)0); } HCL_ASSERT (hcl, carry[0] == 0); } else if (negx) { /* x is negative, y is positive */ hcl_lidw_t w, carry; carry = 1; for (i = 0; i < ys; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w ^ ((hcl_oop_liword_t)y)->slot[i]; } /* treat the lacking part in y as all 0s */ for (; i < xs; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w; } HCL_ASSERT (hcl, carry == 0); adjust_to_negative: /* 2's complement on the final result */ ((hcl_oop_liword_t)z)->slot[zs] = ~(hcl_liw_t)0; carry = 1; for (i = 0; i <= zs; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)z)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w; } HCL_ASSERT (hcl, carry == 0); HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } else if (negy) { /* x is positive, y is negative */ hcl_lidw_t w, carry; /* x & 2's complement on y up to ys */ carry = 1; for (i = 0; i < ys; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)y)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i] ^ (hcl_liw_t)w; } HCL_ASSERT (hcl, carry == 0); /* treat the lacking part in y as all 1s */ for (; i < xs; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i] ^ (~(hcl_liw_t)0); } goto adjust_to_negative; } else { /* both are positive */ for (i = 0; i < ys; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i] ^ ((hcl_oop_liword_t)y)->slot[i]; } /* treat the lacking part in y as all 0s */ for (; i < xs; i++) { ((hcl_oop_liword_t)z)->slot[i] = ((hcl_oop_liword_t)x)->slot[i]; } } return normalize_bigint(hcl, z); } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_bitinvint (hcl_t* hcl, hcl_oop_t x) { if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); v = ~v; if (HCL_IN_SMOOI_RANGE(v)) return HCL_SMOOI_TO_OOP(v); return make_bigint_with_ooi (hcl, v); } else { hcl_oop_t z; hcl_oow_t i, xs, zs, zalloc; int negx; if (!hcl_isbigint(hcl,x)) goto oops_einval; xs = HCL_OBJ_GET_SIZE(x); negx = HCL_IS_NBIGINT(hcl, x); if (negx) { zalloc = xs; zs = xs; } else { zalloc = xs + 1; zs = xs; } if (zalloc < zs) { /* overflow in zalloc calculation above */ hcl_seterrnum (hcl, HCL_EOOMEM); /* TODO: is it a soft failure or hard failure? */ return HCL_NULL; } hcl_pushvolat (hcl, &x); z = hcl_makebigint(hcl, HCL_BRAND_PBIGINT, HCL_NULL, zalloc); hcl_popvolat (hcl); if (!z) return HCL_NULL; if (negx) { hcl_lidw_t w, carry; carry = 1; for (i = 0; i < xs; i++) { w = (hcl_lidw_t)((hcl_liw_t)~HCL_OBJ_GET_LIWORD_VAL(x, i)) + carry; carry = w >> HCL_LIW_BITS; HCL_OBJ_SET_LIWORD_VAL (z, i, ~(hcl_liw_t)w); } HCL_ASSERT (hcl, carry == 0); } else { hcl_lidw_t w, carry; #if 0 for (i = 0; i < xs; i++) { HCL_OBJ_SET_LIWORD_VAL (z, i, ~HCL_OBJ_GET_LIWORD_VAL(x, i)); } HCL_OBJ_SET_LIWORD_VAL (z, zs, ~(hcl_liw_t)0); carry = 1; for (i = 0; i <= zs; i++) { w = (hcl_lidw_t)((hcl_liw_t)~HCL_OBJ_GET_LIWORD_VAL(z, i)) + carry; carry = w >> HCL_LIW_BITS; HCL_OBJ_SET_LIWORD_VAL (z, i, (hcl_liw_t)w); } HCL_ASSERT (hcl, carry == 0); #else carry = 1; for (i = 0; i < xs; i++) { w = (hcl_lidw_t)(HCL_OBJ_GET_LIWORD_VAL(x, i)) + carry; carry = w >> HCL_LIW_BITS; HCL_OBJ_SET_LIWORD_VAL (z, i, (hcl_liw_t)w); } HCL_ASSERT (hcl, i == zs); HCL_OBJ_SET_LIWORD_VAL (z, i, (hcl_liw_t)carry); HCL_ASSERT (hcl, (carry >> HCL_LIW_BITS) == 0); #endif HCL_OBJ_SET_FLAGS_BRAND (z, HCL_BRAND_NBIGINT); } return normalize_bigint(hcl, z); } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O", x); return HCL_NULL; } static HCL_INLINE hcl_oop_t rshift_negative_bigint (hcl_t* hcl, hcl_oop_t x, hcl_oow_t shift) { hcl_oop_t z; hcl_lidw_t w; hcl_lidw_t carry; hcl_oow_t i, xs; HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, x)); xs = HCL_OBJ_GET_SIZE(x); hcl_pushvolat (hcl, &x); /* +1 for the second inversion below */ z = hcl_makebigint(hcl, HCL_BRAND_NBIGINT, HCL_NULL, xs + 1); hcl_popvolat (hcl); if (!z) return HCL_NULL; /* the following lines roughly for 'z = hcl_bitinv (hcl, x)' */ carry = 1; for (i = 0; i < xs; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)x)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; HCL_OBJ_SET_LIWORD_VAL (z, i, ~(hcl_liw_t)w); } HCL_ASSERT (hcl, carry == 0); /* shift to the right */ rshift_unsigned_array (((hcl_oop_liword_t)z)->slot, xs, shift); /* the following lines roughly for 'z = hcl_bitinv (hcl, z)' */ #if 0 for (i = 0; i < xs; i++) { HCL_OBJ_SET_LIWORD_VAL (z, i, ~HCL_OBJ_GET_LIWORD_VAL(z, i)); } HCL_OBJ_SET_LIWORD_VAL (z, xs, ~(hcl_liw_t)0); carry = 1; for (i = 0; i <= xs; i++) { w = (hcl_lidw_t)((hcl_liw_t)~((hcl_oop_liword_t)z)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; HCL_OBJ_SET_LIWORD_VAL (z, i, (hcl_liw_t)w); } HCL_ASSERT (hcl, carry == 0); #else carry = 1; for (i = 0; i < xs; i++) { w = (hcl_lidw_t)(((hcl_oop_liword_t)z)->slot[i]) + carry; carry = w >> HCL_LIW_BITS; ((hcl_oop_liword_t)z)->slot[i] = (hcl_liw_t)w; } HCL_OBJ_SET_LIWORD_VAL (z, i, (hcl_liw_t)carry); HCL_ASSERT (hcl, (carry >> HCL_LIW_BITS) == 0); #endif return z; /* z is not normalized */ } #if defined(HCL_LIMIT_OBJ_SIZE) /* nothing */ #else static HCL_INLINE hcl_oop_t rshift_negative_bigint_and_normalize (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; hcl_oow_t shift; int sign; HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, x)); HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, y)); /* for convenience in subtraction below. * it could be HCL_TYPE_MAX(hcl_oow_t) * if make_bigint_with_intmax() or something * similar were used instead of HCL_SMOOI_TO_OOP().*/ shift = HCL_SMOOI_MAX; do { hcl_pushvolat (hcl, &y); z = rshift_negative_bigint (hcl, x, shift); hcl_popvolat (hcl); if (!z) return HCL_NULL; /* y is a negative number. use hcl_addints() until it becomes 0 */ hcl_pushvolat (hcl, &z); y = hcl_addints (hcl, y, HCL_SMOOI_TO_OOP(shift)); hcl_popvolat (hcl); if (!y) return HCL_NULL; sign = integer_to_oow_noseterr(hcl, y, &shift); if (sign == 0) shift = HCL_SMOOI_MAX; else { if (shift == 0) { /* no more shift */ return normalize_bigint (hcl, z); } HCL_ASSERT (hcl, sign <= -1); } hcl_pushvolat (hcl, &y); x = normalize_bigint (hcl, z); hcl_popvolat (hcl); if (!x) return HCL_NULL; if (HCL_OOP_IS_SMOOI(x)) { /* for normaization above, x can become a small integer */ hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); HCL_ASSERT (hcl, v < 0); /* normal right shift of a small negative integer */ if (shift >= HCL_OOI_BITS - 1) { /* when y is still a large integer, this condition is met * met as HCL_SMOOI_MAX > HCL_OOI_BITS. so i can simly * terminate the loop after this */ return HCL_SMOOI_TO_OOP(-1); } else { v = (hcl_ooi_t)(((hcl_oow_t)v >> shift) | HCL_HBMASK(hcl_oow_t, shift)); if (HCL_IN_SMOOI_RANGE(v)) return HCL_SMOOI_TO_OOP(v); else return make_bigint_with_ooi (hcl, v); } } } while (1); /* this part must not be reached */ HCL_ASSERT (hcl, !"internal error - must not happen"); hcl_seterrnum (hcl, HCL_EINTERN); return HCL_NULL; } static HCL_INLINE hcl_oop_t rshift_positive_bigint_and_normalize (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; hcl_oow_t zs, shift; int sign; HCL_ASSERT (hcl, HCL_IS_PBIGINT(hcl, x)); HCL_ASSERT (hcl, HCL_IS_NBIGINT(hcl, y)); zs = HCL_OBJ_GET_SIZE(x); hcl_pushvolat (hcl, &y); z = clone_bigint (hcl, x, zs); hcl_popvolat (hcl); if (!z) return HCL_NULL; /* for convenience in subtraction below. * it could be HCL_TYPE_MAX(hcl_oow_t) * if make_bigint_with_intmax() or something * similar were used instead of HCL_SMOOI_TO_OOP().*/ shift = HCL_SMOOI_MAX; do { rshift_unsigned_array (((hcl_oop_liword_t)z)->slot, zs, shift); if (count_effective (((hcl_oop_liword_t)z)->slot, zs) == 1 && HCL_OBJ_GET_LIWORD_VAL(z, 0) == 0) { /* if z is 0, i don't have to go on */ break; } /* y is a negative number. use hcl_addints() until it becomes 0 */ hcl_pushvolat (hcl, &z); y = hcl_addints(hcl, y, HCL_SMOOI_TO_OOP(shift)); hcl_popvolat (hcl); if (!y) return HCL_NULL; sign = integer_to_oow_noseterr(hcl, y, &shift); if (sign == 0) shift = HCL_SMOOI_MAX; else { if (shift == 0) break; HCL_ASSERT (hcl, sign <= -1); } } while (1); return normalize_bigint(hcl, z); } static HCL_INLINE hcl_oop_t lshift_bigint_and_normalize (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { hcl_oop_t z; hcl_oow_t wshift, shift; int sign; HCL_ASSERT (hcl, HCL_IS_PBIGINT(hcl, y)); /* this loop is very inefficient as shifting is repeated * with lshift_unsigned_array(). however, this part of the * code is not likey to be useful because the amount of * memory available is certainly not enough to support * huge shifts greater than HCL_TYPE_MAX(hcl_oow_t) */ shift = HCL_SMOOI_MAX; do { /* for convenience only in subtraction below. * should it be between HCL_SMOOI_MAX and HCL_TYPE_MAX(hcl_oow_t), * the second parameter to hcl_subints() can't be composed * using HCL_SMOOI_TO_OOP() */ wshift = shift / HCL_LIW_BITS; if (shift > wshift * HCL_LIW_BITS) wshift++; hcl_pushvolat (hcl, &y); z = expand_bigint (hcl, x, wshift); hcl_popvolat (hcl); if (!z) return HCL_NULL; lshift_unsigned_array (((hcl_oop_liword_t)z)->slot, HCL_OBJ_GET_SIZE(z), shift); hcl_pushvolat (hcl, &y); x = normalize_bigint(hcl, z); hcl_popvolat (hcl); if (!x) return HCL_NULL; hcl_pushvolat (hcl, &x); y = hcl_subints(hcl, y, HCL_SMOOI_TO_OOP(shift)); hcl_popvolat (hcl); if (!y) return HCL_NULL; sign = integer_to_oow_noseterr(hcl, y, &shift); if (sign == 0) shift = HCL_SMOOI_MAX; else { if (shift == 0) { HCL_ASSERT (hcl, is_normalized_integer(hcl, x)); return x; } HCL_ASSERT (hcl, sign >= 1); } } while (1); /* this part must not be reached */ HCL_ASSERT (hcl, !"internal error - must not happen"); hcl_seterrnum (hcl, HCL_EINTERN); return HCL_NULL; } #endif hcl_oop_t hcl_bitshiftint (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { /* left shift if y is positive, * right shift if y is negative */ if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v1, v2; v1 = HCL_OOP_TO_SMOOI(x); v2 = HCL_OOP_TO_SMOOI(y); if (v1 == 0 || v2 == 0) { /* return without cloning as x is a small integer */ return x; } if (v2 > 0) { /* left shift */ hcl_oop_t z; hcl_oow_t wshift; wshift = v2 / HCL_LIW_BITS; if (v2 > wshift * HCL_LIW_BITS) wshift++; z = make_bloated_bigint_with_ooi (hcl, v1, wshift); if (!z) return HCL_NULL; lshift_unsigned_array (((hcl_oop_liword_t)z)->slot, HCL_OBJ_GET_SIZE(z), v2); return normalize_bigint (hcl, z); } else { /* right shift */ hcl_ooi_t v; v2 = -v2; if (v1 < 0) { /* guarantee arithmetic shift preserving the sign bit * regardless of compiler implementation. * * binary decimal shifted by * ------------------------------- * 10000011 (-125) 0 * 11000001 (-63) 1 * 11100000 (-32) 2 * 11110000 (-16) 3 * 11111000 (-8) 4 * 11111100 (-4) 5 * 11111110 (-2) 6 * 11111111 (-1) 7 * 11111111 (-1) 8 */ if (v2 >= HCL_OOI_BITS - 1) v = -1; else { /* HCL_HBMASK_SAFE(hcl_oow_t, v2 + 1) could also be * used as a mask. but the sign bit is shifted in. * so, masking up to 'v2' bits is sufficient */ v = (hcl_ooi_t)(((hcl_oow_t)v1 >> v2) | HCL_HBMASK(hcl_oow_t, v2)); } } else { if (v2 >= HCL_OOI_BITS) v = 0; else v = v1 >> v2; } if (HCL_IN_SMOOI_RANGE(v)) return HCL_SMOOI_TO_OOP(v); return make_bigint_with_ooi (hcl, v); } } else { int sign, negx, negy; hcl_oow_t shift; if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; if (!hcl_isbigint(hcl,y)) goto oops_einval; v = HCL_OOP_TO_SMOOI(x); if (v == 0) return HCL_SMOOI_TO_OOP(0); if (HCL_IS_NBIGINT(hcl, y)) { /* right shift - special case. * x is a small integer. it is just a few bytes long. * y is a large negative integer. its smallest absolute value * is HCL_SMOOI_MAX. i know the final answer. */ return (v < 0)? HCL_SMOOI_TO_OOP(-1): HCL_SMOOI_TO_OOP(0); } hcl_pushvolat (hcl, &y); x = make_bigint_with_ooi (hcl, v); hcl_popvolat (hcl); if (!x) return HCL_NULL; goto bigint_and_bigint; } else if (HCL_OOP_IS_SMOOI(y)) { hcl_ooi_t v; if (!hcl_isbigint(hcl,x)) goto oops_einval; v = HCL_OOP_TO_SMOOI(y); if (v == 0) return clone_bigint (hcl, x, HCL_OBJ_GET_SIZE(x)); negx = HCL_IS_NBIGINT(hcl, x); if (v > 0) { sign = 1; negy = 0; shift = v; goto bigint_and_positive_oow; } else { sign = -1; negy = 1; shift = -v; goto bigint_and_negative_oow; } } else { hcl_oop_t z; if (!hcl_isbigint(hcl,x) || !hcl_isbigint(hcl, y)) goto oops_einval; bigint_and_bigint: negx = HCL_IS_NBIGINT(hcl, x); negy = HCL_IS_NBIGINT(hcl, y); sign = bigint_to_oow_noseterr(hcl, y, &shift); if (sign == 0) { /* y is too big or too small */ if (negy) { /* right shift */ #if defined(HCL_LIMIT_OBJ_SIZE) /* the maximum number of bit shifts are guaranteed to be * small enough to fit into the hcl_oow_t type. so i can * easily assume that all bits are shifted out */ HCL_ASSERT (hcl, HCL_OBJ_SIZE_BITS_MAX <= HCL_TYPE_MAX(hcl_oow_t)); return (negx)? HCL_SMOOI_TO_OOP(-1): HCL_SMOOI_TO_OOP(0); #else if (negx) return rshift_negative_bigint_and_normalize (hcl, x, y); else return rshift_positive_bigint_and_normalize (hcl, x, y); #endif } else { /* left shift */ #if defined(HCL_LIMIT_OBJ_SIZE) /* the maximum number of bit shifts are guaranteed to be * small enough to fit into the hcl_oow_t type. so i can * simply return a failure here becuase it's surely too * large after shifting */ HCL_ASSERT (hcl, HCL_TYPE_MAX(hcl_oow_t) >= HCL_OBJ_SIZE_BITS_MAX); hcl_seterrnum (hcl, HCL_EOOMEM); /* is it a soft failure or a hard failure? is this error code proper? */ return HCL_NULL; #else return lshift_bigint_and_normalize (hcl, x, y); #endif } } else if (sign >= 1) { /* left shift */ hcl_oow_t wshift; bigint_and_positive_oow: wshift = shift / HCL_LIW_BITS; if (shift > wshift * HCL_LIW_BITS) wshift++; z = expand_bigint (hcl, x, wshift); if (!z) return HCL_NULL; lshift_unsigned_array (((hcl_oop_liword_t)z)->slot, HCL_OBJ_GET_SIZE(z), shift); } else { /* right shift */ bigint_and_negative_oow: HCL_ASSERT (hcl, sign <= -1); if (negx) { z = rshift_negative_bigint (hcl, x, shift); if (!z) return HCL_NULL; } else { z = clone_bigint (hcl, x, HCL_OBJ_GET_SIZE(x)); if (!z) return HCL_NULL; rshift_unsigned_array (((hcl_oop_liword_t)z)->slot, HCL_OBJ_GET_SIZE(z), shift); } } return normalize_bigint(hcl, z); } } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } static hcl_uint8_t ooch_val_tab[] = { 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 99, 99, 99, 99, 99, 99, 99, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 99, 99, 99, 99, 99, 99, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 99, 99, 99, 99, 99 }; hcl_oop_t hcl_strtoint (hcl_t* hcl, const hcl_ooch_t* str, hcl_oow_t len, int radix) { int sign = 1; const hcl_ooch_t* ptr, * start, * end; hcl_lidw_t w, v; hcl_liw_t hw[16], * hwp = HCL_NULL; hcl_oow_t hwlen, outlen; hcl_oop_t res; if (radix < 0) { /* when radix is less than 0, it treats it as if '-' is preceeding */ sign = -1; radix = -radix; } HCL_ASSERT (hcl, radix >= 2 && radix <= 36); ptr = str; end = str + len; if (ptr < end) { if (*ptr == '+') ptr++; else if (*ptr == '-') { ptr++; sign = -1; } } if (ptr >= end) goto oops_einval; /* no digits */ while (ptr < end && *ptr == '0') { /* skip leading zeros */ ptr++; } if (ptr >= end) { /* all zeros */ return HCL_SMOOI_TO_OOP(0); } hwlen = 0; start = ptr; /* this is the real start */ if (IS_POW2(radix)) { unsigned int exp; unsigned int bitcnt; /* get log2(radix) in a fast way under the fact that * radix is a power of 2. the exponent acquired is * the number of bits that a digit of the given radix takes up */ /*exp = LOG2_FOR_POW2(radix);*/ exp = _exp_tab[radix - 1]; /* bytes */ outlen = ((hcl_oow_t)(end - str) * exp + 7) / 8; /* number of hcl_liw_t */ outlen = (outlen + HCL_SIZEOF(hw[0]) - 1) / HCL_SIZEOF(hw[0]); if (outlen > HCL_COUNTOF(hw)) { hwp = (hcl_liw_t*)hcl_allocmem(hcl, outlen * HCL_SIZEOF(hw[0])); if (!hwp) return HCL_NULL; } else { hwp = hw; } w = 0; bitcnt = 0; ptr = end - 1; while (ptr >= start) { if (*ptr < 0 || *ptr >= HCL_COUNTOF(ooch_val_tab)) goto oops_einval; v = ooch_val_tab[*ptr]; if (v >= radix) goto oops_einval; w |= (v << bitcnt); bitcnt += exp; if (bitcnt >= HCL_LIW_BITS) { bitcnt -= HCL_LIW_BITS; hwp[hwlen++] = w; /*(hcl_liw_t)(w & HCL_LBMASK(hcl_lidw_t, HCL_LIW_BITS));*/ w >>= HCL_LIW_BITS; } ptr--; } HCL_ASSERT (hcl, w <= HCL_TYPE_MAX(hcl_liw_t)); if (hwlen == 0 || w > 0) hwp[hwlen++] = w; } else { hcl_lidw_t r1, r2; hcl_liw_t multiplier; int dg, i, safe_ndigits; w = 0; ptr = start; safe_ndigits = hcl->bigint[radix].safe_ndigits; multiplier = (hcl_liw_t)hcl->bigint[radix].multiplier; outlen = (end - str) / safe_ndigits + 1; if (outlen > HCL_COUNTOF(hw)) { hwp = (hcl_liw_t*)hcl_allocmem(hcl, outlen * HCL_SIZEOF(hcl_liw_t)); if (!hwp) return HCL_NULL; } else { hwp = hw; } HCL_ASSERT (hcl, ptr < end); do { r1 = 0; for (dg = 0; dg < safe_ndigits; dg++) { if (ptr >= end) { multiplier = 1; for (i = 0; i < dg; i++) multiplier *= radix; break; } if (*ptr < 0 || *ptr >= HCL_COUNTOF(ooch_val_tab)) goto oops_einval; v = ooch_val_tab[*ptr]; if (v >= radix) goto oops_einval; r1 = r1 * radix + (hcl_liw_t)v; ptr++; } r2 = r1; for (i = 0; i < hwlen; i++) { hcl_liw_t high, low; v = (hcl_lidw_t)hwp[i] * multiplier; high = (hcl_liw_t)(v >> HCL_LIW_BITS); low = (hcl_liw_t)(v /*& HCL_LBMASK(hcl_oow_t, HCL_LIW_BITS)*/); #if defined(liw_add_overflow) /* use liw_add_overflow() only if it's compiler-builtin. */ r2 = high + liw_add_overflow(low, r2, &low); #else /* don't use the fall-back version of liw_add_overflow() */ low += r2; r2 = (hcl_lidw_t)high + (low < r2); #endif hwp[i] = low; } if (r2) hwp[hwlen++] = (hcl_liw_t)r2; } while (ptr < end); } HCL_ASSERT (hcl, hwlen >= 1); #if (HCL_LIW_BITS == HCL_OOW_BITS) if (hwlen == 1) { w = hwp[0]; HCL_ASSERT (hcl, -HCL_SMOOI_MAX == HCL_SMOOI_MIN); if (w <= HCL_SMOOI_MAX) return HCL_SMOOI_TO_OOP((hcl_ooi_t)w * sign); } #elif (HCL_LIW_BITS == HCL_OOHW_BITS) if (hwlen == 1) { HCL_ASSERT (hcl, hwp[0] <= HCL_SMOOI_MAX); return HCL_SMOOI_TO_OOP((hcl_ooi_t)hwp[0] * sign); } else if (hwlen == 2) { w = MAKE_WORD(hwp[0], hwp[1]); HCL_ASSERT (hcl, -HCL_SMOOI_MAX == HCL_SMOOI_MIN); if (w <= HCL_SMOOI_MAX) return HCL_SMOOI_TO_OOP((hcl_ooi_t)w * sign); } #else # error UNSUPPORTED LIW BIT SIZE #endif res = hcl_makebigint(hcl, (sign < 0? HCL_BRAND_NBIGINT: HCL_BRAND_PBIGINT), hwp, hwlen); if (hwp && hw != hwp) hcl_freemem (hcl, hwp); return res; oops_einval: if (hwp && hw != hwp) hcl_freemem (hcl, hwp); hcl_seterrnum (hcl, HCL_EINVAL); return HCL_NULL; } static hcl_oow_t oow_to_text (hcl_t* hcl, hcl_oow_t w, int flagged_radix, hcl_ooch_t* buf) { hcl_ooch_t* ptr; const char* _digitc; int radix; radix = flagged_radix & HCL_INTTOSTR_RADIXMASK; _digitc = _digitc_array[!!(flagged_radix & HCL_INTTOSTR_LOWERCASE)]; HCL_ASSERT (hcl, radix >= 2 && radix <= 36); ptr = buf; do { *ptr++ = _digitc[w % radix]; w /= radix; } while (w > 0); return ptr - buf; } static void reverse_string (hcl_ooch_t* str, hcl_oow_t len) { hcl_ooch_t ch; hcl_ooch_t* start = str; hcl_ooch_t* end = str + len - 1; while (start < end) { ch = *start; *start++ = *end; *end-- = ch; } } hcl_oop_t hcl_eqints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { return (HCL_OOP_TO_SMOOI(x) == HCL_OOP_TO_SMOOI(y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(x) || HCL_OOP_IS_SMOOI(y)) { return hcl->_false; } else { if (!hcl_isbigint(hcl, x) || !hcl_isbigint(hcl, y)) goto oops_einval; return is_equal(hcl, x, y)? hcl->_true: hcl->_false; } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_neints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { return (HCL_OOP_TO_SMOOI(x) != HCL_OOP_TO_SMOOI(y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(x) || HCL_OOP_IS_SMOOI(y)) { return hcl->_true; } else { if (!hcl_isbigint(hcl, x) || !hcl_isbigint(hcl, y)) goto oops_einval; return !is_equal(hcl, x, y)? hcl->_true: hcl->_false; } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_gtints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { return (HCL_OOP_TO_SMOOI(x) > HCL_OOP_TO_SMOOI(y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl, y)) goto oops_einval; return (HCL_IS_NBIGINT(hcl, y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(y)) { if (!hcl_isbigint(hcl, x)) goto oops_einval; return (HCL_IS_PBIGINT(hcl, x))? hcl->_true: hcl->_false; } else { if (!hcl_isbigint(hcl, x) || !hcl_isbigint(hcl, y)) goto oops_einval; return is_greater(hcl, x, y)? hcl->_true: hcl->_false; } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_geints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { return (HCL_OOP_TO_SMOOI(x) >= HCL_OOP_TO_SMOOI(y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl, y)) goto oops_einval; return (HCL_IS_NBIGINT(hcl, y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(y)) { if (!hcl_isbigint(hcl, x)) goto oops_einval; return (HCL_IS_PBIGINT(hcl, x))? hcl->_true: hcl->_false; } else { if (!hcl_isbigint(hcl, x) || !hcl_isbigint(hcl, y)) goto oops_einval; return (is_greater(hcl, x, y) || is_equal(hcl, x, y))? hcl->_true: hcl->_false; } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_ltints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { return (HCL_OOP_TO_SMOOI(x) < HCL_OOP_TO_SMOOI(y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl, y)) goto oops_einval; return (HCL_IS_PBIGINT(hcl, y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(y)) { if (!hcl_isbigint(hcl, x)) goto oops_einval; return (HCL_IS_NBIGINT(hcl, x))? hcl->_true: hcl->_false; } else { if (!hcl_isbigint(hcl, x) || !hcl_isbigint(hcl, y)) goto oops_einval; return is_less(hcl, x, y)? hcl->_true: hcl->_false; } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_leints (hcl_t* hcl, hcl_oop_t x, hcl_oop_t y) { if (HCL_OOP_IS_SMOOI(x) && HCL_OOP_IS_SMOOI(y)) { return (HCL_OOP_TO_SMOOI(x) <= HCL_OOP_TO_SMOOI(y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(x)) { if (!hcl_isbigint(hcl, y)) goto oops_einval; return (HCL_IS_PBIGINT(hcl, y))? hcl->_true: hcl->_false; } else if (HCL_OOP_IS_SMOOI(y)) { if (!hcl_isbigint(hcl, x)) goto oops_einval; return (HCL_IS_NBIGINT(hcl, x))? hcl->_true: hcl->_false; } else { if (!hcl_isbigint(hcl, x) || !hcl_isbigint(hcl, y)) goto oops_einval; return (is_less(hcl, x, y) || is_equal(hcl, x, y))? hcl->_true: hcl->_false; } oops_einval: hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O, %O", x, y); return HCL_NULL; } hcl_oop_t hcl_sqrtint (hcl_t* hcl, hcl_oop_t x) { /* TODO: find a faster and more efficient algorithm??? */ hcl_oop_t a, b, m, m2, t; int neg; if (!hcl_isint(hcl, x)) { hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O", x); return HCL_NULL; } a = hcl->_nil; b = hcl->_nil; m = hcl->_nil; m2 = hcl->_nil; hcl_pushvolat (hcl, &x); hcl_pushvolat (hcl, &a); hcl_pushvolat (hcl, &b); hcl_pushvolat (hcl, &m); hcl_pushvolat (hcl, &m2); a = hcl_ltints(hcl, x, HCL_SMOOI_TO_OOP(0)); if (!a) goto oops; if (a == hcl->_true) { /* the given number is a negative number. * i will arrange the return value to be negative. */ x = hcl_negateint(hcl, x); if (!x) goto oops; neg = 1; } else neg = 0; a = HCL_SMOOI_TO_OOP(1); b = hcl_bitshiftint(hcl, x, HCL_SMOOI_TO_OOP(-5)); if (!b) goto oops; b = hcl_addints(hcl, b, HCL_SMOOI_TO_OOP(8)); if (!b) goto oops; while (1) { t = hcl_geints(hcl, b, a); if (!t) return HCL_NULL; if (t == hcl->_false) break; m = hcl_addints(hcl, a, b); if (!m) goto oops; m = hcl_bitshiftint(hcl, m, HCL_SMOOI_TO_OOP(-1)); if (!m) goto oops; m2 = hcl_mulints(hcl, m, m); if (!m2) goto oops; t = hcl_gtints(hcl, m2, x); if (!t) return HCL_NULL; if (t == hcl->_true) { b = hcl_subints(hcl, m, HCL_SMOOI_TO_OOP(1)); if (!b) goto oops; } else { a = hcl_addints(hcl, m, HCL_SMOOI_TO_OOP(1)); if (!a) goto oops; } } hcl_popvolats (hcl, 5); x = hcl_subints(hcl, a, HCL_SMOOI_TO_OOP(1)); if (!x) return HCL_NULL; if (neg) x = hcl_negateint(hcl, x); return x; oops: hcl_popvolats (hcl, 5); return HCL_NULL; } hcl_oop_t hcl_absint (hcl_t* hcl, hcl_oop_t x) { if (HCL_OOP_IS_SMOOI(x)) { hcl_ooi_t v; v = HCL_OOP_TO_SMOOI(x); if (v < 0) { v = -v; x = HCL_SMOOI_TO_OOP(v); } } else if (HCL_IS_NBIGINT(hcl, x)) { x = _clone_bigint(hcl, x, HCL_OBJ_GET_SIZE(x), HCL_BRAND_PBIGINT); } else if (HCL_IS_PBIGINT(hcl, x)) { /* do nothing. return x without change. * [THINK] but do i need to clone a positive bigint? */ } else { hcl_seterrbfmt (hcl, HCL_EINVAL, "not integer - %O", x); return HCL_NULL; } return x; } static HCL_INLINE hcl_liw_t get_last_digit (hcl_t* hcl, hcl_liw_t* x, hcl_oow_t* xs, int radix) { /* this function changes the contents of the large integer word array */ hcl_oow_t oxs = *xs; hcl_liw_t carry = 0; hcl_oow_t i; hcl_lidw_t dw; HCL_ASSERT (hcl, oxs > 0); for (i = oxs; i > 0; ) { --i; dw = ((hcl_lidw_t)carry << HCL_LIW_BITS) + x[i]; /* TODO: optimize it with ASM - no seperate / and % */ x[i] = (hcl_liw_t)(dw / radix); carry = (hcl_liw_t)(dw % radix); } if (/*oxs > 0 &&*/ x[oxs - 1] == 0) *xs = oxs - 1; return carry; } hcl_oop_t hcl_inttostr (hcl_t* hcl, hcl_oop_t num, int flagged_radix) { hcl_ooi_t v = 0; hcl_oow_t w; hcl_oow_t as; hcl_liw_t* t = HCL_NULL; hcl_ooch_t* xbuf = HCL_NULL; hcl_oow_t xlen = 0, reqcapa; int radix; const char* _digitc; radix = flagged_radix & HCL_INTTOSTR_RADIXMASK; _digitc = _digitc_array[!!(flagged_radix & HCL_INTTOSTR_LOWERCASE)]; HCL_ASSERT (hcl, radix >= 2 && radix <= 36); if (!hcl_isint(hcl,num)) goto oops_einval; v = integer_to_oow_noseterr(hcl, num, &w); if (v) { /* The largest buffer is required for radix 2. * For a binary conversion(radix 2), the number of bits is * the maximum number of digits that can be produced. +1 is * needed for the sign. */ reqcapa = HCL_OOW_BITS + 1; if (hcl->inttostr.xbuf.capa < reqcapa) { xbuf = (hcl_ooch_t*)hcl_reallocmem(hcl, hcl->inttostr.xbuf.ptr, reqcapa * HCL_SIZEOF(*xbuf)); if (!xbuf) return HCL_NULL; hcl->inttostr.xbuf.capa = reqcapa; hcl->inttostr.xbuf.ptr = xbuf; } else { xbuf = hcl->inttostr.xbuf.ptr; } xlen = oow_to_text(hcl, w, flagged_radix, xbuf); if (v < 0) xbuf[xlen++] = '-'; reverse_string (xbuf, xlen); if (flagged_radix & HCL_INTTOSTR_NONEWOBJ) { /* special case. don't create a new object. * the caller can use the data left in hcl->inttostr.xbuf */ hcl->inttostr.xbuf.len = xlen; return hcl->_nil; } return hcl_makestring(hcl, xbuf, xlen); } as = HCL_OBJ_GET_SIZE(num); reqcapa = as * HCL_LIW_BITS + 1; if (hcl->inttostr.xbuf.capa < reqcapa) { xbuf = (hcl_ooch_t*)hcl_reallocmem(hcl, hcl->inttostr.xbuf.ptr, reqcapa * HCL_SIZEOF(*xbuf)); if (!xbuf) return HCL_NULL; hcl->inttostr.xbuf.capa = reqcapa; hcl->inttostr.xbuf.ptr = xbuf; } else { xbuf = hcl->inttostr.xbuf.ptr; } if (hcl->inttostr.t.capa < as) { t = (hcl_liw_t*)hcl_reallocmem(hcl, hcl->inttostr.t.ptr, reqcapa * HCL_SIZEOF(*t)); if (!t) return HCL_NULL; hcl->inttostr.t.capa = as; hcl->inttostr.t.ptr = t; } else { t = hcl->inttostr.t.ptr; } HCL_MEMCPY (t, ((hcl_oop_liword_t)num)->slot, HCL_SIZEOF(*t) * as); do { hcl_liw_t dv = get_last_digit(hcl, t, &as, radix); xbuf[xlen++] = _digitc[dv]; } while (as > 0); if (HCL_IS_NBIGINT(hcl, num)) xbuf[xlen++] = '-'; reverse_string (xbuf, xlen); if (flagged_radix & HCL_INTTOSTR_NONEWOBJ) { /* special case. don't create a new object. * the caller can use the data left in hcl->inttostr.xbuf */ hcl->inttostr.xbuf.len = xlen; return hcl->_nil; } return hcl_makestring(hcl, xbuf, xlen); oops_einval: hcl_seterrnum (hcl, HCL_EINVAL); return HCL_NULL; }