gambas 58ddc650ad Try to add some more static datatype analysis, but did not succed.
[COMPILER]
* NEW: Try to add some more static datatype analysis, but did not succed.
2018-03-03 03:14:11 +01:00

857 lines
15 KiB
C

/***************************************************************************
gbc_trans.c
(c) 2000-2017 Benoît Minisini <g4mba5@gmail.com>
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2, or (at your option)
any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
MA 02110-1301, USA.
***************************************************************************/
#define __GBC_TRANS_C
#include <stdlib.h>
#include <string.h>
#include <stdio.h>
#include <ctype.h>
#include <errno.h>
#include <math.h>
#include <float.h>
#include <limits.h>
#include "gb_common.h"
#include "gb_error.h"
#include "gbc_compile.h"
#include "gbc_read.h"
#include "gbc_trans.h"
#include "gb_reserved.h"
#include "gb_code.h"
#define IS_PURE_INTEGER(_int64_val) ((_int64_val) == ((int)(_int64_val)))
short TRANS_in_assignment = 0;
short TRANS_in_left_value = 0;
bool TRANS_in_try = FALSE;
void TRANS_reset(void)
{
JOB->line = JOB->first_line;
JOB->current = JOB->pattern;
JOB->end = &(JOB->pattern[JOB->pattern_count]);
}
static bool read_integer(char *number, int base, bool minus, int64_t *result)
{
uint64_t nbr2, nbr;
int d, n;
unsigned char c;
int nmax;
n = 0;
nbr = 0;
switch (base)
{
case 2: nmax = 64; break;
case 8: nmax = 21; break;
case 16: nmax = 16; break;
case 10: default: nmax = 19; break;
}
if (base == 10)
{
c = *number++;
for(;;)
{
if (isdigit(c))
d = c - '0';
else
break;
n++;
if (n < nmax)
nbr = nbr * 10 + d;
else
{
nbr2 = nbr * 10 + d;
if ((nbr2 / 10) != nbr || nbr2 > ((uint64_t)LLONG_MAX + minus))
return TRUE;
nbr = nbr2;
}
c = *number++;
if (!c)
break;
}
}
else
{
c = *number++;
for(;;)
{
if (isdigit(c))
d = c - '0';
else if (c >= 'A' && c <='Z')
d = c - 'A' + 10;
else if (c >= 'a' && c <='z')
d = c - 'a' + 10;
else
break;
if (d >= base)
break;
n++;
if (n > nmax)
return TRUE;
nbr = nbr * base + d;
c = *number++;
if (!c)
break;
}
if ((c == '&' || c == 'u' || c == 'U') && base != 10)
c = *number++;
else
{
if ((base == 16 && n == 4) || (base == 2 && n == 16))
{
if (nbr >= 0x8000L && nbr <= 0xFFFFL)
nbr |= INT64_C(0xFFFFFFFFFFFF0000);
}
else if ((base == 16 && n == 8) || (base == 2 && n == 32))
{
if (nbr >= 0x80000000L && nbr <= 0xFFFFFFFFL)
nbr |= INT64_C(0xFFFFFFFF00000000);
}
}
}
if (c)
return TRUE;
if (n == 0)
return TRUE;
*((int64_t *)result) = nbr;
return FALSE;
}
static bool read_float(char *number, double *result)
{
unsigned char c;
double nint;
double nfrac, n;
int nexp;
bool nexp_minus;
nint = 0.0;
nfrac = 0.0;
nexp = 0;
nexp_minus = FALSE;
c = *number++;
/* Integer part */
for(;;)
{
if (c == '.')
{
c = *number++;
break;
}
if (!c || !isdigit(c))
return TRUE;
nint = nint * 10 + (c - '0');
c = *number++;
if (c == 'e' || c == 'E')
break;
if (!c || isspace(c))
goto __END;
}
/* Decimal part */
n = 0.1;
for(;;)
{
if (!c || !isdigit(c))
break;
nfrac += n * (c - '0');
n /= 10;
c = *number++;
}
/* Exponent */
if (c == 'e' || c == 'E')
{
c = *number++;
if (c == '+' || c == '-')
{
if (c == '-')
nexp_minus = TRUE;
c = *number++;
}
if (!c || !isdigit(c))
return TRUE;
for(;;)
{
nexp = nexp * 10 + (c - '0');
if (nexp > DBL_MAX_10_EXP)
return TRUE;
c = *number++;
if (!c || !isdigit(c))
break;
}
}
if (c)
return TRUE;
__END:
*result = (nint + nfrac) * pow(10, nexp_minus ? (-nexp) : nexp);
return FALSE;
}
bool TRANS_get_number(int index, TRANS_NUMBER *result)
{
char buffer[68];
SYMBOL *sym;
char *number;
unsigned char c;
int64_t val = 0;
double dval = 0.0;
int type;
int base = 10;
bool minus = FALSE;
bool complex = FALSE;
sym = TABLE_get_symbol(JOB->class->table, index);
if (sym->len > 66)
return TRUE;
memcpy(buffer, sym->name, sym->len);
buffer[sym->len] = 0;
number = buffer;
c = *number++;
if (c == '+' || c == '-')
{
minus = (c == '-');
c = *number++;
}
if (c == '&')
{
c = *number++;
if (c == 'H' || c == 'h')
{
base = 16;
c = *number++;
}
else if (c == 'X' || c == 'x')
{
base = 2;
c = *number++;
}
else if (c == 'O' || c == 'o')
{
base = 8;
c = *number++;
}
else
base = 16;
}
else if (c == '%')
{
base = 2;
c = *number++;
}
if (!c)
return TRUE;
if (c == '-' || c == '+')
return TRUE;
errno = 0;
number--;
if (base == 10 && tolower(buffer[sym->len - 1]) == 'i')
{
buffer[sym->len - 1] = 0;
complex = TRUE;
}
if (!read_integer(number, base, minus, &val))
{
if (minus) val = (-val);
if (IS_PURE_INTEGER(val))
{
type = T_INTEGER;
goto __END;
}
else
{
type = T_LONG;
goto __END;
}
}
if (base == 10)
{
if (!read_float(number, &dval))
{
if (minus) dval = (-dval);
type = T_FLOAT;
goto __END;
}
}
return TRUE;
__END:
result->type = type;
result->complex = complex;
if (type == T_INTEGER)
result->lval = result->ival = val;
else if (type == T_LONG)
result->lval = val;
else
result->dval = dval;
return FALSE;
}
static PATTERN *trans_embedded_array(PATTERN *look, int mode, TRANS_DECL *result)
{
TRANS_NUMBER tnum;
int i;
if (!(mode & TT_CAN_EMBED))
{
if (PATTERN_is(*look, RS_LSQR))
THROW("Embedded arrays are forbidden here");
return look;
}
if (!PATTERN_is(*look, RS_LSQR))
return look;
look++;
if (mode && TT_CAN_ARRAY)
{
for (i = 0;; i++)
{
if (i >= MAX_ARRAY_DIM)
THROW("Too many dimensions");
if (!PATTERN_is_number(*look))
THROW(E_SYNTAX);
if (TRANS_get_number(PATTERN_index(*look), &tnum))
THROW(E_SYNTAX);
if (tnum.type != T_INTEGER)
THROW(E_SYNTAX);
if (tnum.ival < 1 || tnum.ival > (2 << 22)) /* 4 Mo, ca devrait suffire... ;-) */
THROW("Bad subscript range");
result->array.dim[i] = tnum.ival;
result->array.ndim++;
look++;
if (PATTERN_is(*look, RS_RSQR))
break;
if (!PATTERN_is(*look, RS_COMMA))
THROW(E_MISSING, "','");
look++;
}
}
if (!PATTERN_is(*look, RS_RSQR))
THROW(E_MISSING, "']'");
result->is_embedded = TRUE;
look++;
return look;
}
static int TRANS_get_class(PATTERN pattern, bool array)
{
int index = PATTERN_index(pattern);
int index_array;
//CLASS_REF *cref;
if (!CLASS_exist_class(JOB->class, index))
{
if (array)
{
// Maybe a compound class?
CLASS_SYMBOL *sym = CLASS_get_symbol(JOB->class, index);
int i;
char c;
//fprintf(stderr, "TRANS_get_class: %.*s\n", sym->symbol.len, sym->symbol.name);
for (i = sym->symbol.len - 1; i >= 0; i--)
{
c = sym->symbol.name[i];
if (c == '[')
{
//fprintf(stderr, "TRANS_get_class: find %.*s\n", i, sym->symbol.name);
if (TABLE_find_symbol(JOB->class->table, sym->symbol.name, i, &index_array))
{
index_array = TRANS_get_class(PATTERN_make(RT_CLASS, index_array), TRUE);
if (JOB->class->class[index_array].exported)
index = CLASS_add_class_exported(JOB->class, index);
else
index = CLASS_add_class(JOB->class, index);
/*cref = &JOB->class->class[index];
if (TYPE_is_null(cref->array))
{
cref->array.t.id = T_OBJECT;
cref->array.t.value = index_array;
}*/
return index;
}
}
}
}
THROW("Unknown identifier: &1", TABLE_get_symbol_name(JOB->class->table, index));
}
return CLASS_add_class(JOB->class, index);
}
static bool check_structure(int *cindex)
{
SYMBOL *sym = TABLE_get_symbol(JOB->class->table, JOB->class->class[*cindex].index);
int len = sym->len;
char name[sym->len + 1];
int index;
bool is_array;
strncpy(name, sym->name, len);
while (name[len - 1] == ']')
len -= 2;
name[len] = 0;
if (len < sym->len)
{
if (!TABLE_find_symbol(JOB->class->table, name, len, &index))
goto __ERROR;
index = CLASS_add_class(JOB->class, index);
is_array = TRUE;
}
else
{
index = *cindex;
is_array = FALSE;
}
if (JOB->class->class[index].structure)
{
*cindex = index;
return is_array;
}
__ERROR:
THROW("&1 is not a structure", name);
}
bool TRANS_type(int mode, TRANS_DECL *result)
{
PATTERN *look = JOB->current;
short id;
int value;
int flag = 0;
bool is_array;
/* Do not fill the structure with zeros */
TYPE_clear(&result->type);
result->is_new = FALSE;
result->is_embedded = FALSE;
result->init = NULL;
result->array.ndim = 0;
look = trans_embedded_array(look, mode, result);
if (!PATTERN_is(*look, RS_AS))
{
if (mode & TT_DO_NOT_CHECK_AS)
return FALSE;
else
THROW(E_MISSING, "AS");
}
look++;
if (mode & TT_CAN_NEW)
{
if (PATTERN_is(*look, RS_NEW))
{
if (result->is_embedded) //TYPE_get_id(result->type) == T_ARRAY)
THROW("Cannot mix NEW and embedded array");
result->is_new = TRUE;
look++;
result->init = look;
}
}
if ((mode & TT_CAN_EMBED) && PATTERN_is(*look, RS_STRUCT))
{
id = T_STRUCT;
look++;
if (!PATTERN_is_class(*look))
THROW_UNEXPECTED(look);
value = TRANS_get_class(*look, TRUE);
is_array = check_structure(&value);
if (!is_array)
{
if (result->is_new)
THROW("Cannot mix NEW and embedded structure");
//if (result->array.ndim > 0)
// THROW("Cannot mix embedded array and embedded structure");
}
else
THROW("Arrays of structure are not supported");
look++;
}
else
{
if (!PATTERN_is_type(*look) && !PATTERN_is_class(*look))
THROW_UNEXPECTED(look);
if (PATTERN_is_type(*look))
{
id = RES_get_type(PATTERN_index(*look));
value = -1;
}
else
{
id = T_OBJECT;
value = TRANS_get_class(*look, TRUE);
}
if (PATTERN_is(look[1], RS_LSQR))
{
value = CLASS_get_array_class(JOB->class, id, value);
id = T_OBJECT;
if (!PATTERN_is(look[2], RS_RSQR))
{
if ((mode & TT_CAN_NEW) && result->is_new)
{
//if (TYPE_get_id(result->type) == T_ARRAY)
// THROW("Cannot mix NEW and static array declaration");
//result->is_new = TRUE;
result->init = look;
}
else
THROW("Syntax error");
}
while (!PATTERN_is_newline(*look))
look++;
}
else
{
//if (id == T_OBJECT)
// value = (-1);
look++;
}
}
if (id == T_VOID)
return FALSE;
/*
if (result->is_array && result->array.ndim == 0)
result->is_array = FALSE;
*/
if (result->array.ndim > 0)
{
result->array.type = TYPE_make(id, value, flag);
result->type = TYPE_make(T_ARRAY, CLASS_add_array(JOB->class, &result->array), 0);
}
else if (id == T_STRUCT)
{
result->type = TYPE_make(id, value, flag);
}
else
{
result->type = TYPE_make(id, value, flag);
if ((mode & TT_CAN_NEW) && !result->is_new && PATTERN_is(*look, RS_EQUAL))
{
look++;
result->init = look;
while (!PATTERN_is_newline(*look))
look++;
}
}
JOB->current = look;
return TRUE;
}
bool TRANS_check_declaration(void)
{
PATTERN *look = JOB->current;
if (!PATTERN_is_identifier(*look))
return FALSE;
look++;
if (PATTERN_is(*look, RS_LSQR))
{
for(;;)
{
look++;
if (PATTERN_is(*look, RS_RSQR))
break;
if (PATTERN_is_newline(*look))
return FALSE;
}
look++;
}
if (!PATTERN_is(*look, RS_AS))
return FALSE;
return TRUE;
}
PATTERN *TRANS_get_constant_value(TRANS_DECL *decl, PATTERN *current)
{
int index;
TRANS_NUMBER number = {0};
int type;
PATTERN value;
type = TYPE_get_id(decl->type);
value = *current++;
index = PATTERN_index(value);
if (type == T_STRING)
{
if (PATTERN_is(value, RS_LBRA))
{
value = *current++;
if (!PATTERN_is_string(value))
THROW("Constant string expected");
index = PATTERN_index(value);
value = *current++;
if (!PATTERN_is(value, RS_RBRA))
THROW("Missing right brace");
TYPE_set_id(&decl->type, T_CSTRING);
}
else
{
if (!PATTERN_is_string(value))
THROW("Constant string expected");
}
decl->is_integer = FALSE;
decl->value = index;
}
else
{
if (PATTERN_is_string(value))
THROW("Syntax error");
if (type != T_BOOLEAN && type <= T_FLOAT)
{
if (TRANS_get_number(index, &number))
THROW("Type mismatch");
}
switch(type)
{
case T_BOOLEAN:
decl->is_integer = TRUE;
if (PATTERN_is(value, RS_TRUE))
decl->value = -1L;
else if (PATTERN_is(value, RS_FALSE))
decl->value = 0L;
else
THROW("Type mismatch");
break;
case T_BYTE: case T_SHORT: case T_INTEGER:
decl->is_integer = TRUE;
if (number.type != T_INTEGER)
{
if (number.type == T_LONG)
THROW("Out of range");
else
THROW("Type mismatch");
}
if (((type == T_BYTE) && (number.ival < 0 || number.ival > 255))
|| ((type == T_SHORT) && (number.ival < -32768L || number.ival > 32767L)))
THROW("Out of range");
decl->value = number.ival;
//fprintf(stderr, "TRANS_get_constant_value: INT: %ld\n", decl->value);
break;
case T_FLOAT: case T_SINGLE:
if (type == T_SINGLE && !finite((float)number.dval))
THROW("Out of range");
decl->is_integer = FALSE;
decl->value = index;
break;
case T_LONG:
if (number.type == T_FLOAT)
THROW("Type mismatch");
decl->is_integer = FALSE;
decl->value = index;
decl->lvalue = number.lval;
//fprintf(stderr, "TRANS_get_constant_value: LONG: %lld\n", decl->lvalue);
break;
default:
THROW("Bad constant type");
}
}
return current;
}
void TRANS_want(int reserved, char *msg)
{
if (!PATTERN_is(*JOB->current, reserved))
THROW("Syntax error. &1 expected", msg ? msg : COMP_res_info[reserved].name);
JOB->current++;
}
void TRANS_want_newline()
{
if (!TRANS_newline())
THROW_UNEXPECTED(JOB->current);
}
void TRANS_ignore(int reserved)
{
if (PATTERN_is(*JOB->current, reserved))
JOB->current++;
}
bool TRANS_is_end_function(bool is_proc, PATTERN *look)
{
if (PATTERN_is_newline(*look))
return TRUE;
if (is_proc)
return PATTERN_is(*look, RS_PROCEDURE) || PATTERN_is(*look, RS_SUB);
else
return PATTERN_is(*look, RS_FUNCTION);
}
char *TRANS_get_num_desc(int num)
{
static const char *num_desc[3] = { "first", "second", "third" };
static char desc[6];
if (num < 1)
return NULL;
if (ERROR_translate)
{
snprintf(desc, sizeof(desc), "#%d", num);
}
else
{
if (num < 4)
return (char *)num_desc[num - 1];
snprintf(desc, sizeof(desc), "%dth", num);
}
return desc;
}