gambas-source-code/main/gbx/gbx_number.c
Benoît Minisini 9fd602df70 Add Base() / Base$() and Dec() / FromBase() subroutines.
[COMPILER]
* NEW: Add Base() / Base$() subroutines.
* NEW: Add Dec() / FromBase() subroutines.

[INTERPRRETER]
* NEW: Add Base() / Base$() subroutines.
* NEW: Add Dec() / FromBase() subroutines.
2023-09-29 02:51:42 +02:00

625 lines
10 KiB
C

/***************************************************************************
gbx_number.c
(c) 2000-2017 Benoît Minisini <benoit.minisini@gambas-basic.org>
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2, or (at your option)
any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
MA 02110-1301, USA.
***************************************************************************/
#define __GBX_NUMBER_C
#include "gb_common.h"
#include "gb_error.h"
#include "gb_limit.h"
#include <ctype.h>
#include <float.h>
#include <math.h>
#include "gbx_type.h"
#include "gb_common_buffer.h"
#include "gbx_local.h"
#include "gbx_math.h"
#include "gbx_string.h"
#include "gbx_number.h"
#define buffer_init COMMON_buffer_init
#define get_char COMMON_get_char
#define last_char COMMON_last_char
#define look_char COMMON_look_char
#define put_char COMMON_put_char
#define jump_space COMMON_jump_space
#define get_current COMMON_get_current
#define buffer_pos COMMON_pos
#define get_size_left COMMON_get_size_left
#define has_string COMMON_has_string
#define IS_PURE_INTEGER(_int64_val) ((_int64_val) == ((int)(_int64_val)))
static uint64_t _pow_10[18] = {
10,
100,
1000,
10000,
100000,
1000000,
10000000,
100000000,
1000000000,
10000000000,
100000000000,
1000000000000,
10000000000000,
100000000000000,
1000000000000000,
10000000000000000,
100000000000000000,
1000000000000000000
};
static int read_integer(int base, bool minus, int64_t *result, bool local, bool after)
{
static unsigned char nmax_base[36] = {
0, 64, 40, 32, 27, 24, 22, 21, 20, 19,
18, 17, 17, 16, 16, 16, 15, 15, 15, 14,
14, 14, 14, 13, 13, 13, 13, 13, 13, 13,
12, 12, 12, 12, 12, 12
};
uint64_t nbr;
int d, n, c, nmax;
const char *thsep;
int lthsep;
int ndigit_thsep;
bool first_thsep;
thsep = LOCAL_get(local)->thousand_sep;
lthsep = LOCAL_get(local)->len_thousand_sep;
ndigit_thsep = 0;
first_thsep = FALSE;
n = 0;
nbr = 0;
nmax = nmax_base[base - 1];
c = last_char();
if (base == 10)
{
for(;;)
{
if (local)
{
COMMON_pos--;
if (has_string(thsep, lthsep) && (ndigit_thsep == 3 || (!first_thsep && ndigit_thsep >= 1 && ndigit_thsep <= 3)))
{
COMMON_pos += lthsep;
c = get_char();
first_thsep = TRUE;
ndigit_thsep = 0;
}
else
COMMON_pos++;
}
if (c >= '0' && c <= '9')
{
d = c - '0';
if (local)
ndigit_thsep++;
}
else
break;
n++;
if (n < nmax)
{
nbr = nbr * 10 + d;
}
else
{
if (__builtin_umull_overflow(nbr, 10, &nbr))
return NB_READ_OVERFLOW;
if (__builtin_uaddl_overflow(nbr, (uint64_t)d, &nbr))
return NB_READ_OVERFLOW;
}
c = get_char();
if (c < 0)
break;
}
c = last_char();
if (local && first_thsep && ndigit_thsep != 3)
return NB_READ_SYNTAX;
}
else
{
for(;;)
{
if (c >= '0' && c <= '9')
d = c - '0';
else if (c >= 'A' && c <='Z')
d = c - 'A' + 10;
else if (c >= 'a' && c <='z')
d = c - 'a' + 10;
else
break;
if (d >= base)
break;
n++;
if (n < nmax)
{
nbr = nbr * base + d;
}
else
{
if (__builtin_umull_overflow(nbr, base, &nbr))
return NB_READ_OVERFLOW;
if (__builtin_uaddl_overflow(nbr, (uint64_t)d, &nbr))
return NB_READ_OVERFLOW;
}
c = get_char();
if (c < 0)
break;
}
if (after)
{
c = last_char();
if ((c == '&' || c == 'u' || c == 'U') && base != 10)
c = get_char();
else
{
if ((base == 16 && n == 4) || (base == 2 && n == 16))
{
if (nbr >= 0x8000L && nbr <= 0xFFFFL)
nbr |= INT64_C(0xFFFFFFFFFFFF0000);
}
else if ((base == 16 && n == 8) || (base == 2 && n == 32))
{
if (nbr >= 0x80000000L && nbr <= 0xFFFFFFFFL)
nbr |= INT64_C(0xFFFFFFFF00000000);
}
}
}
}
if (c > 0 && !isspace(c))
return NB_READ_SYNTAX;
if (n == 0)
return NB_READ_SYNTAX;
*((int64_t *)result) = nbr;
return NB_READ_INTEGER;
}
static bool read_float(double *result, bool local)
{
LOCAL_INFO *local_info;
char point;
const char *thsep;
int lthsep;
int ndigit_thsep;
bool first_thsep;
int c, n;
uint64_t mantisse, mantisse_int;
int ndigit_frac, ndigit_frac_zero;
bool frac;
bool frac_null;
bool nozero;
int nexp;
bool nexp_minus;
local_info = LOCAL_get(local);
point = local_info->decimal_point;
thsep = local_info->thousand_sep;
lthsep = local_info->len_thousand_sep;
ndigit_thsep = 0;
first_thsep = FALSE;
c = last_char();
n = 0;
mantisse = 0;
mantisse_int = 0;
frac = FALSE;
frac_null = TRUE;
ndigit_frac = 0;
ndigit_frac_zero = 0;
nexp = 0;
nexp_minus = FALSE;
nozero = FALSE;
// Integer part
for(;;)
{
if (c == point)
{
c = get_char();
frac = TRUE;
mantisse_int = mantisse;
break;
}
if (local)
{
COMMON_pos--;
if (has_string(thsep, lthsep) && (ndigit_thsep == 3 || (!first_thsep && ndigit_thsep >= 1 && ndigit_thsep <= 3)))
{
COMMON_pos += lthsep;
first_thsep = TRUE;
ndigit_thsep = 0;
c = get_char();
}
else
COMMON_pos++;
}
if (!isdigit(c) || (c < 0))
break;
if (c != '0')
nozero = TRUE;
if (nozero)
n++;
if (n > MAX_FLOAT_DIGIT)
{
if (n == (MAX_FLOAT_DIGIT + 1) && (c >= '5'))
mantisse++;
ndigit_frac--; // ???
c = get_char();
continue;
}
if (c == '0')
mantisse *= 10;
else
mantisse = mantisse * 10 + (c - '0');
if (local)
ndigit_thsep++;
c = get_char();
if (c == 'e' || c == 'E')
break;
if (c < 0)
goto __END;
}
// Decimal part
for(;;)
{
if (c == point)
break;
if (!isdigit(c) || (c < 0))
break;
if (c != '0')
nozero = TRUE;
if (nozero)
n++;
if (n > MAX_FLOAT_DIGIT)
{
if (n == (MAX_FLOAT_DIGIT + 1) && (c >= '5'))
mantisse++;
if (!frac)
ndigit_frac--;
c = get_char();
continue;
}
if (c == '0')
ndigit_frac_zero++;
else
{
frac_null = FALSE;
ndigit_frac += ndigit_frac_zero + 1;
mantisse = mantisse * _pow_10[ndigit_frac_zero] + (c - '0');
ndigit_frac_zero = 0;
}
c = get_char();
if (c == 'e' || c == 'E')
break;
if (c < 0)
goto __END;
}
// Exponant
if (c == 'e' || c == 'E')
{
c = get_char();
if (c == '+' || c == '-')
{
if (c == '-')
nexp_minus = TRUE;
c = get_char();
}
if (!isdigit(c) || (c < 0))
return TRUE;
for(;;)
{
nexp = nexp * 10 + (c - '0');
if (nexp > DBL_MAX_10_EXP)
return TRUE;
c = get_char();
if (!isdigit(c) || (c < 0))
break;
}
if (nexp_minus)
nexp = (-nexp);
}
if (c >= 0 && !isspace(c))
return TRUE;
__END:
if (local && first_thsep && ndigit_thsep != 3)
return TRUE;
if (frac && frac_null)
mantisse = mantisse_int;
else
nexp -= ndigit_frac;
//fprintf(stderr, "%.24g %d\n", (double)mantisse, nexp);
//*result = mulpow10((double)mantisse, nexp);
*result = (double)mantisse * pow10(nexp);
return FALSE;
}
bool NUMBER_from_string(int option, const char *str, int len, VALUE *value)
{
int c;
int64_t val = 0;
double dval = 0.0;
TYPE type;
int base = 10;
bool minus = FALSE;
int pos;
buffer_init(str, len);
jump_space();
c = get_char();
if (c == '+' || c == '-')
{
minus = (c == '-');
c = get_char();
}
if (option & NB_READ_INT_LONG)
{
if (option & NB_READ_HEX_BIN)
{
if (c == '&')
{
c = get_char();
if (c == 'H' || c == 'h')
{
base = 16;
c = get_char();
}
else if (c == 'O' || c == 'o')
{
base = 8;
c = get_char();
}
else if (c == 'X' || c == 'x')
{
base = 2;
c = get_char();
}
else
base = 16;
}
else if (c == '%')
{
base = 2;
c = get_char();
}
}
}
if (c < 0)
return TRUE;
if (c == '-' || c == '+')
return TRUE;
errno = 0;
pos = COMMON_pos - 1;
if (read_integer(base, minus, &val, (option & NB_LOCAL) != 0, TRUE) == NB_READ_INTEGER)
{
if (minus) val = (-val);
if ((option & NB_READ_INTEGER) && IS_PURE_INTEGER(val))
{
type = T_INTEGER;
goto __END;
}
else if ((option & NB_READ_LONG))
{
type = T_LONG;
goto __END;
}
else if ((option & NB_READ_FLOAT) && base == 10)
{
type = T_FLOAT;
dval = (double)val;
goto __END;
}
}
if ((option & NB_READ_FLOAT) && base == 10)
{
COMMON_pos = pos;
get_char();
if (!read_float(&dval, (option & NB_LOCAL) != 0))
{
if (minus) dval = (-dval);
type = T_FLOAT;
goto __END;
}
}
return TRUE;
__END:
if (last_char() >= 0) //(c >= 0 && !isspace(c))
return TRUE;
value->type = type;
if (type == T_INTEGER)
value->_integer.value = val;
else if (type == T_LONG)
value->_long.value = val;
else
value->_float.value = dval;
//fprintf(stderr, "return FALSE\n");
return FALSE;
}
void NUMBER_int_to_string(uint64_t nbr, int prec, int base, VALUE *value)
{
char *ptr;
char *src;
int digit, len;
bool neg;
len = 0;
ptr = &COMMON_buffer[COMMON_BUF_MAX];
if (nbr == 0 && prec == 0)
{
STRING_char_value(value, '0');
return;
}
neg = (nbr & (1LL << 63)) != 0;
if (base == 10 && neg)
nbr = 1 + ~nbr;
while (nbr > 0)
{
digit = nbr % base;
nbr /= base;
ptr--;
len++;
if (digit < 10)
*ptr = '0' + digit;
else
*ptr = 'A' + digit - 10;
}
if (neg)
{
if (prec)
{
ptr += len - prec;
len = prec;
}
if (base == 10)
{
len++;
ptr--;
*ptr = '-';
}
STRING_new_temp_value(value, NULL, len);
src = value->_string.addr;
memcpy(src, ptr, len);
}
else
{
STRING_new_temp_value(value, NULL, Max(len, prec));
src = value->_string.addr;
while (prec > len)
{
*src++ = '0';
prec--;
}
memcpy(src, ptr, len);
}
}
int NUMBER_read_integer(const char *str, int len, int base, int64_t *result)
{
int err;
buffer_init(str, len);
get_char();
err = read_integer(base, FALSE, result, FALSE, FALSE);
if (err == NB_READ_INTEGER && !IS_PURE_INTEGER(*result))
err = NB_READ_LONG;
return err;
}