/*************************************************************************** gbx_number.c (c) 2000-2017 BenoƮt Minisini This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. ***************************************************************************/ #define __GBX_NUMBER_C #include "gb_common.h" #include "gb_error.h" #include "gb_limit.h" #include #include #include #include "gbx_type.h" #include "gb_common_buffer.h" #include "gbx_local.h" #include "gbx_math.h" #include "gbx_string.h" #include "gbx_number.h" #define buffer_init COMMON_buffer_init #define get_char COMMON_get_char #define last_char COMMON_last_char #define look_char COMMON_look_char #define put_char COMMON_put_char #define jump_space COMMON_jump_space #define get_current COMMON_get_current #define buffer_pos COMMON_pos #define get_size_left COMMON_get_size_left #define has_string COMMON_has_string #define IS_PURE_INTEGER(_int64_val) ((_int64_val) == ((int)(_int64_val))) static uint64_t _pow_10[18] = { 10, 100, 1000, 10000, 100000, 1000000, 10000000, 100000000, 1000000000, 10000000000, 100000000000, 1000000000000, 10000000000000, 100000000000000, 1000000000000000, 10000000000000000, 100000000000000000, 1000000000000000000 }; static int read_integer(int base, bool minus, int64_t *result, bool local, bool after) { static unsigned char nmax_base[36] = { 0, 64, 40, 32, 27, 24, 22, 21, 20, 19, 18, 17, 17, 16, 16, 16, 15, 15, 15, 14, 14, 14, 14, 13, 13, 13, 13, 13, 13, 13, 12, 12, 12, 12, 12, 12 }; uint64_t nbr; int d, n, c, nmax; const char *thsep; int lthsep; int ndigit_thsep; bool first_thsep; thsep = LOCAL_get(local)->thousand_sep; lthsep = LOCAL_get(local)->len_thousand_sep; ndigit_thsep = 0; first_thsep = FALSE; n = 0; nbr = 0; nmax = nmax_base[base - 1]; c = last_char(); if (base == 10) { for(;;) { if (local) { COMMON_pos--; if (has_string(thsep, lthsep) && (ndigit_thsep == 3 || (!first_thsep && ndigit_thsep >= 1 && ndigit_thsep <= 3))) { COMMON_pos += lthsep; c = get_char(); first_thsep = TRUE; ndigit_thsep = 0; } else COMMON_pos++; } if (c >= '0' && c <= '9') { d = c - '0'; if (local) ndigit_thsep++; } else break; n++; if (n < nmax) { nbr = nbr * 10 + d; } else { if (__builtin_umull_overflow(nbr, 10, &nbr)) return NB_READ_OVERFLOW; if (__builtin_uaddl_overflow(nbr, (uint64_t)d, &nbr)) return NB_READ_OVERFLOW; } c = get_char(); if (c < 0) break; } c = last_char(); if (local && first_thsep && ndigit_thsep != 3) return NB_READ_SYNTAX; } else { for(;;) { if (c >= '0' && c <= '9') d = c - '0'; else if (c >= 'A' && c <='Z') d = c - 'A' + 10; else if (c >= 'a' && c <='z') d = c - 'a' + 10; else break; if (d >= base) break; n++; if (n < nmax) { nbr = nbr * base + d; } else { if (__builtin_umull_overflow(nbr, base, &nbr)) return NB_READ_OVERFLOW; if (__builtin_uaddl_overflow(nbr, (uint64_t)d, &nbr)) return NB_READ_OVERFLOW; } c = get_char(); if (c < 0) break; } if (after) { c = last_char(); if ((c == '&' || c == 'u' || c == 'U') && base != 10) c = get_char(); else { if ((base == 16 && n == 4) || (base == 2 && n == 16)) { if (nbr >= 0x8000L && nbr <= 0xFFFFL) nbr |= INT64_C(0xFFFFFFFFFFFF0000); } else if ((base == 16 && n == 8) || (base == 2 && n == 32)) { if (nbr >= 0x80000000L && nbr <= 0xFFFFFFFFL) nbr |= INT64_C(0xFFFFFFFF00000000); } } } } if (c > 0 && !isspace(c)) return NB_READ_SYNTAX; if (n == 0) return NB_READ_SYNTAX; *((int64_t *)result) = nbr; return NB_READ_INTEGER; } static bool read_float(double *result, bool local) { LOCAL_INFO *local_info; char point; const char *thsep; int lthsep; int ndigit_thsep; bool first_thsep; int c, n; uint64_t mantisse, mantisse_int; int ndigit_frac, ndigit_frac_zero; bool frac; bool frac_null; bool nozero; int nexp; bool nexp_minus; local_info = LOCAL_get(local); point = local_info->decimal_point; thsep = local_info->thousand_sep; lthsep = local_info->len_thousand_sep; ndigit_thsep = 0; first_thsep = FALSE; c = last_char(); n = 0; mantisse = 0; mantisse_int = 0; frac = FALSE; frac_null = TRUE; ndigit_frac = 0; ndigit_frac_zero = 0; nexp = 0; nexp_minus = FALSE; nozero = FALSE; // Integer part for(;;) { if (c == point) { c = get_char(); frac = TRUE; mantisse_int = mantisse; break; } if (local) { COMMON_pos--; if (has_string(thsep, lthsep) && (ndigit_thsep == 3 || (!first_thsep && ndigit_thsep >= 1 && ndigit_thsep <= 3))) { COMMON_pos += lthsep; first_thsep = TRUE; ndigit_thsep = 0; c = get_char(); } else COMMON_pos++; } if (!isdigit(c) || (c < 0)) break; if (c != '0') nozero = TRUE; if (nozero) n++; if (n > MAX_FLOAT_DIGIT) { if (n == (MAX_FLOAT_DIGIT + 1) && (c >= '5')) mantisse++; ndigit_frac--; // ??? c = get_char(); continue; } if (c == '0') mantisse *= 10; else mantisse = mantisse * 10 + (c - '0'); if (local) ndigit_thsep++; c = get_char(); if (c == 'e' || c == 'E') break; if (c < 0) goto __END; } // Decimal part for(;;) { if (c == point) break; if (!isdigit(c) || (c < 0)) break; if (c != '0') nozero = TRUE; if (nozero) n++; if (n > MAX_FLOAT_DIGIT) { if (n == (MAX_FLOAT_DIGIT + 1) && (c >= '5')) mantisse++; if (!frac) ndigit_frac--; c = get_char(); continue; } if (c == '0') ndigit_frac_zero++; else { frac_null = FALSE; ndigit_frac += ndigit_frac_zero + 1; mantisse = mantisse * _pow_10[ndigit_frac_zero] + (c - '0'); ndigit_frac_zero = 0; } c = get_char(); if (c == 'e' || c == 'E') break; if (c < 0) goto __END; } // Exponant if (c == 'e' || c == 'E') { c = get_char(); if (c == '+' || c == '-') { if (c == '-') nexp_minus = TRUE; c = get_char(); } if (!isdigit(c) || (c < 0)) return TRUE; for(;;) { nexp = nexp * 10 + (c - '0'); if (nexp > DBL_MAX_10_EXP) return TRUE; c = get_char(); if (!isdigit(c) || (c < 0)) break; } if (nexp_minus) nexp = (-nexp); } if (c >= 0 && !isspace(c)) return TRUE; __END: if (local && first_thsep && ndigit_thsep != 3) return TRUE; if (frac && frac_null) mantisse = mantisse_int; else nexp -= ndigit_frac; //fprintf(stderr, "%.24g %d\n", (double)mantisse, nexp); //*result = mulpow10((double)mantisse, nexp); *result = (double)mantisse * pow10(nexp); return FALSE; } bool NUMBER_from_string(int option, const char *str, int len, VALUE *value) { int c; int64_t val = 0; double dval = 0.0; TYPE type; int base = 10; bool minus = FALSE; int pos; buffer_init(str, len); jump_space(); c = get_char(); if (c == '+' || c == '-') { minus = (c == '-'); c = get_char(); } if (option & NB_READ_INT_LONG) { if (option & NB_READ_HEX_BIN) { if (c == '&') { c = get_char(); if (c == 'H' || c == 'h') { base = 16; c = get_char(); } else if (c == 'O' || c == 'o') { base = 8; c = get_char(); } else if (c == 'X' || c == 'x') { base = 2; c = get_char(); } else base = 16; } else if (c == '%') { base = 2; c = get_char(); } } } if (c < 0) return TRUE; if (c == '-' || c == '+') return TRUE; errno = 0; pos = COMMON_pos - 1; if (read_integer(base, minus, &val, (option & NB_LOCAL) != 0, TRUE) == NB_READ_INTEGER) { if (minus) val = (-val); if ((option & NB_READ_INTEGER) && IS_PURE_INTEGER(val)) { type = T_INTEGER; goto __END; } else if ((option & NB_READ_LONG)) { type = T_LONG; goto __END; } else if ((option & NB_READ_FLOAT) && base == 10) { type = T_FLOAT; dval = (double)val; goto __END; } } if ((option & NB_READ_FLOAT) && base == 10) { COMMON_pos = pos; get_char(); if (!read_float(&dval, (option & NB_LOCAL) != 0)) { if (minus) dval = (-dval); type = T_FLOAT; goto __END; } } return TRUE; __END: if (last_char() >= 0) //(c >= 0 && !isspace(c)) return TRUE; value->type = type; if (type == T_INTEGER) value->_integer.value = val; else if (type == T_LONG) value->_long.value = val; else value->_float.value = dval; //fprintf(stderr, "return FALSE\n"); return FALSE; } void NUMBER_int_to_string(uint64_t nbr, int prec, int base, VALUE *value) { char *ptr; char *src; int digit, len; bool neg; len = 0; ptr = &COMMON_buffer[COMMON_BUF_MAX]; if (nbr == 0 && prec == 0) { STRING_char_value(value, '0'); return; } neg = (nbr & (1LL << 63)) != 0; if (base == 10 && neg) nbr = 1 + ~nbr; while (nbr > 0) { digit = nbr % base; nbr /= base; ptr--; len++; if (digit < 10) *ptr = '0' + digit; else *ptr = 'A' + digit - 10; } if (neg) { if (prec) { ptr += len - prec; len = prec; } if (base == 10) { len++; ptr--; *ptr = '-'; } STRING_new_temp_value(value, NULL, len); src = value->_string.addr; memcpy(src, ptr, len); } else { STRING_new_temp_value(value, NULL, Max(len, prec)); src = value->_string.addr; while (prec > len) { *src++ = '0'; prec--; } memcpy(src, ptr, len); } } int NUMBER_read_integer(const char *str, int len, int base, int64_t *result) { int err; buffer_init(str, len); get_char(); err = read_integer(base, FALSE, result, FALSE, FALSE); if (err == NB_READ_INTEGER && !IS_PURE_INTEGER(*result)) err = NB_READ_LONG; return err; }