#include <stdlib.h>
#include <assert.h>
#include <string.h>
#include <stdio.h>
#include "semantics.h"
#include "ast.h"
#define NEW(type) ((type *)malloc(sizeof(type)))
#define CHECK_TYPE(p, _type) assert(p->type == _type)
#define ERROR(x) do { error_print x; } while (0)
#define WARNING(x) do { warning_print x; } while (0)
#define NOT_IGNORE_VOID(et, ast) \
if (et->type == CVOID) \
do { \
ERROR((ast, "void value not ignored as it ought to be")); \
} while (0)
#define INCOMP_TYPE(ast) \
do { \
ERROR((ast, "incompatible types when assigning")); \
} while (0)
/* pointer to function conversion (std 6.3.2/4) */
#define FUNC_POINTER_CONV(t) \
do { \
if ((t)->type == CFUNC) \
{ \
CType_t f = ctype_create("", CPTR, p); \
f->rec.ref = t; \
t = f; \
} \
} while (0)
#define CHECK_CVOID(name, ast) \
if (type_spec->type == CVOID) \
do { \
ERROR((ast, "variable or field '%s' declared void", name)); \
} while (0)
#define IS_INT(tt) ((tt) == CINT || (tt) == CCHAR)
#define IS_PTR(tt) ((tt) == CPTR || (tt) == CARR)
#define IS_SCALAR(tt) (!((tt) == CUNION || (tt) == CSTRUCT))
#define IS_ARITH(tt) IS_INT(tt)
extern void print_error(char *, char *, int, int, int);
extern char *load_line(int);
static char err_buff[MAX_ERROR_BUFF];
static CType_t basic_type_int;
static CType_t basic_type_char;
static CType_t basic_type_void;
static CType_t builtin_printf;
static CType_t builtin_scanf;
static CType_t builtin_malloc;
static void error_print(CNode *ast, const char *fmt, ...) {
va_list args;
va_start(args, fmt);
vsprintf(err_buff, fmt, args);
print_error(err_buff, NULL, ast->loc.row, ast->loc.col, 0);
va_end(args);
}
static void warning_print(CNode *ast, const char *fmt, ...) {
va_list args;
va_start(args, fmt);
vsprintf(err_buff, fmt, args);
print_error(err_buff, NULL, ast->loc.row, ast->loc.col, 1);
va_end(args);
}
const char *csymbol_getname(CSymbol_t sym) {
return (sym->kind == CVAR) ?
sym->rec.var->name : sym->rec.type->name;
}
#ifdef CIBIC_DEBUG
CTable_t ctable_create(Hashfunc_t hfunc, Printfunc_t pfunc) {
CTable_t ct = NEW(CTable);
memset(ct->head, 0, sizeof(CTNode*) * MAX_TABLE_SIZE);
ct->hfunc = hfunc;
ct->pfunc = pfunc;
return ct;
}
#else
CTable_t ctable_create(Hashfunc_t hfunc) {
CTable_t ct = NEW(CTable);
memset(ct->head, 0, sizeof(CTNode*) * MAX_TABLE_SIZE);
ct->hfunc = hfunc;
return ct;
}
#endif
void ctable_destory(CTable_t ct) {
int i;
for (i = 0; i < MAX_TABLE_SIZE; i++)
{
CTNode *p, *np;
for (p = ct->head[i]; p; p = np)
{
np = p->next;
free(p);
}
}
}
void *ctable_lookup(CTable_t ct, const char *key) {
unsigned int hv = ct->hfunc(key) % MAX_TABLE_SIZE;
CTNode *p = ct->head[hv];
for (; p; p = p->next)
if (!strcmp(p->key, key))
return p->val;
return NULL; /* not found */
}
int ctable_insert(CTable_t ct, const char *key, void *val, int lvl) {
unsigned int hv = ct->hfunc(key) % MAX_TABLE_SIZE;
CTNode *p = ct->head[hv];
CTNode *np;
for (; p && p->lvl == lvl; p = p->next)
if (!strcmp(p->key, key))
return 0; /* conflict */
np = NEW(CTNode);
np->key = key;
np->val = val;
np->lvl = lvl;
np->next = ct->head[hv];
ct->head[hv] = np;
return 1;
}
void ctable_clip(CTable_t ct, const char *key, int max_lvl) {
unsigned int hv = ct->hfunc(key) % MAX_TABLE_SIZE;
CTNode *p = ct->head[hv], *np;
for (; p && p->lvl > max_lvl; p = np)
{
np = p->next;
free(p);
}
ct->head[hv] = p;
}
CScope_t cscope_create() {
CScope_t p = NEW(CScope);
p->lvl = -1;
p->top = NULL;
p->func = NULL;
p->inside_loop = 0;
#ifdef CIBIC_DEBUG
p->ids = ctable_create(bkdr_hash, csymbol_print);
p->tags = ctable_create(bkdr_hash, csymbol_print);
#else
p->ids = ctable_create(bkdr_hash);
p->tags = ctable_create(bkdr_hash);
#endif
cscope_enter(p);
return p;
}
static int cscope_push(CScope_t cs, CSymbol_t sym, int nspace) {
CTable_t ct = nspace == NS_ID ? cs->ids: cs->tags;
#ifdef CIBIC_DEBUG
assert(cs->top);
#endif
if (ctable_insert(ct, csymbol_getname(sym), sym, cs->lvl))
{
CSElem *e = NEW(CSElem);
e->sym = sym;
e->next = cs->top->symlist;
cs->top->symlist = e;
return 1;
}
else return 0; /* naming conflict */
}
int cscope_push_var(CScope_t cs, CVar_t var, int nspace) {
CSymbol_t p = NEW(CSymbol);
p->kind = CVAR;
p->rec.var = var;
if (!cscope_push(cs, p, nspace))
{
free(p);
return 0;
}
return 1;
}
int cscope_push_type(CScope_t cs, CType_t type, int nspace) {
CSymbol_t p = NEW(CSymbol);
p->kind = CTYPE;
p->rec.type = type;
if (!cscope_push(cs, p, nspace))
{
free(p);
return 0;
}
return 1;
}
void cscope_enter(CScope_t cs) {
CSNode *np = NEW(CSNode);
np->next = cs->top;
np->symlist = NULL;
cs->top = np;
cs->lvl++;
}
void cscope_exit(CScope_t cs) {
CSNode *top_o = cs->top;
CSElem *p, *np;
cs->lvl--;
cs->top = top_o->next;
for (p = top_o->symlist; p; p = np)
{
const char *name = csymbol_getname(p->sym);
ctable_clip(cs->ids, name, cs->lvl);
ctable_clip(cs->tags, name, cs->lvl);
np = p->next;
free(p->sym); /* free CSymbol */
free(p); /* free CSElem */
}
free(top_o);
}
void ctable_debug_print(CTable_t ct) {
int i;
fprintf(stderr, "*** CTable ***\n");
for (i = 0; i < MAX_TABLE_SIZE; i++)
if (ct->head[i])
{
CTNode *p;
fprintf(stderr, "[%04d]", i);
for (p = ct->head[i]; p; p = p->next)
fprintf(stderr, "->[%s:%d]", ct->pfunc(p->val), p->lvl);
fprintf(stderr, "\n");
}
fprintf(stderr, "*** CTable ***\n");
}
void cscope_debug_print(CScope_t cs) {
int lvl = cs->lvl;
CSNode *p;
CSElem *tp;
fprintf(stderr, "\n****** CScope ******\n");
for (p = cs->top; p; p = p->next)
{
fprintf(stderr, "Level %d:\n", lvl--);
for (tp = p->symlist; tp; tp = tp->next)
fprintf(stderr, "%s ", csymbol_print(tp->sym));
fprintf(stderr, "\n\n");
}
fprintf(stderr, "IDs:\n");
ctable_debug_print(cs->ids);
fprintf(stderr, "Tags:\n");
ctable_debug_print(cs->tags);
fprintf(stderr, "****** CScope ******\n\n");
}
CSymbol_t cscope_lookup(CScope_t cs, const char *name, int nspace) {
if (nspace == NS_ID)
return ctable_lookup(cs->ids, name);
else
return ctable_lookup(cs->tags, name);
return NULL;
}
unsigned int bkdr_hash(const char *str) {
unsigned int seed = 131;
unsigned int hv = 0;
while (*str)
hv = hv * seed + (unsigned)(*str++);
return hv;
}
const char *csymbol_print(void *csym) {
CSymbol_t p = (CSymbol_t)csym;
static char buff[MAX_DEBUG_PRINT_BUFF];
if (p->kind == CVAR)
sprintf(buff, "%s@%lx", p->rec.var->name, (size_t)p->rec.var);
else
sprintf(buff, "%s@%lx", p->rec.type->name, (size_t)p->rec.type);
return buff;
}
const char *ctable_cvar_print(void *var) {
static char buff[MAX_DEBUG_PRINT_BUFF];
sprintf(buff, "%s@%lx", ((CVar_t )var)->name, (size_t)var);
return buff;
}
CVar_t cvar_create(const char *name, CType_t type, CNode *ast) {
CVar_t cv = NEW(CVar);
cv->name = name;
cv->type = type;
cv->ast = ast;
return cv;
}
CType_t ctype_create(const char *name, int type, CNode *ast) {
CType_t ct = NEW(CType);
ct->name = name;
ct->type = type;
ct->ast = ast;
switch (type)
{
case CINT: ct->size = INT_SIZE; break;
case CCHAR: ct->size = CHAR_SIZE; break;
case CVOID: ct->size = 0; break;
}
return ct;
}
void ctype_print(CType_t);
void cvar_print(CVar_t cv) {
fprintf(stderr, "[var@%lx:%s]->", (size_t)cv, cv->name);
ctype_print(cv->type);
}
void ctype_print(CType_t ct) {
switch (ct->type)
{
case CINT:
fprintf(stderr, "[int]"); break;
case CCHAR:
fprintf(stderr, "[char]"); break;
case CVOID:
fprintf(stderr, "[void]"); break;
case CSTRUCT:
case CUNION:
{
CTable_t f = ct->rec.fields;
int i;
CTNode *fn;
fprintf(stderr, "[%s@%lx:(name:%s|fields:",
ct->type == CSTRUCT ? "struct" : "union",
(size_t)ct,
ct->name);
if (f)
{
int first = 1;
for (i = 0; i < MAX_TABLE_SIZE; i++)
for (fn = f->head[i]; fn; fn = fn->next)
{
fprintf(stderr, "%s", first ? (first = 0, "") : ",");
cvar_print((CVar_t)fn->val);
}
}
fprintf(stderr, ")]");
}
break;
case CARR:
{
fprintf(stderr, "[arr:(%d)]->", ct->rec.arr.len);
ctype_print(ct->rec.arr.elem);
}
break;
case CPTR:
{
fprintf(stderr, "[ptr]->");
ctype_print(ct->rec.ref);
}
break;
case CFUNC:
{
CVar_t p;
fprintf(stderr, "[func:(name:%s|params:", ct->name);
for (p = ct->rec.func.params; p; p = p->next)
{
cvar_print(p);
if (p->next) fprintf(stderr, ",");
}
fprintf(stderr, "|local:");
for (p = ct->rec.func.local; p; p = p->next)
{
cvar_print(p);
if (p->next) fprintf(stderr, ",");
}
fprintf(stderr, ")]->");
ctype_print(ct->rec.func.ret);
}
break;
}
}
static CType_t struct_type_merge(CType_t new, CScope_t scope) {
/* Note: we shall try to lookup first instead of pushing !! */
CSymbol_t lu = cscope_lookup(scope, new->name, NS_TAG);
CType_t old;
if (!lu) /* create it if it does not exist */
{
cscope_push_type(scope, new, NS_TAG);
return new;
} /* otherwise we have it */
old = lu->rec.type;
if (old->type != new->type) /* not a struct or union */
ERROR((new->ast, "conflicting types of '%s'", new->name));
/* otherwise it is a struct or union */
if (!new->rec.fields) /* use the old definition */
return old;
/* otherwise there's a completion definition */
if (cscope_push_type(scope, new, NS_TAG)) /* try to push the defintion */
return new;
/* conflict appears */
if (old->rec.fields) /* if the old one is complete */
ERROR((new->ast, "redefinition of '%s'", new->name));
/* otherwise incomplete, thus complete the type */
old->rec.fields = new->rec.fields;
old->ast = new->ast;
free(new);
return old;
}
static void type_merge(CType_t old, CType_t new) {
/* assume old and new are the same type */
assert(old->type == new->type);
switch (old->type)
{
case CINT: case CCHAR: case CPTR:
case CUNION: case CSTRUCT:
break;
case CFUNC:
if (new->rec.func.params)
old->rec.func.params = new->rec.func.params;
if (new->rec.func.body)
{
old->rec.func.local = new->rec.func.local;
old->rec.func.body = new->rec.func.body;
}
break;
default: assert(0);
}
}
int is_same_type(CType_t typea, CType_t typeb) {
if (typea == typeb) return 1;
if (typea->type != typeb->type) return 0;
switch (typea->type)
{
case CSTRUCT: case CUNION:
return typea == typeb;
case CARR:
if (typea->rec.arr.len != typeb->rec.arr.len)
return 0;
return is_same_type(typea->rec.arr.elem, typeb->rec.arr.elem);
case CPTR:
return is_same_type(typea->rec.ref, typeb->rec.ref);
case CFUNC:
{
CVar_t pa = typea->rec.func.params,
pb = typeb->rec.func.params;
if ((pa || typea->rec.func.body) &&
(pb || typeb->rec.func.body))
{
for (;pa && pb; pa = pa->next, pb = pb->next)
if (!is_same_type(pa->type, pb->type))
return 0;
if (pa || pb)
return 0; /* different number of parameters */
}
return is_same_type(typea->rec.func.ret, typeb->rec.func.ret);
}
case CINT: case CCHAR: case CVOID:
;
break;
}
return 1;
}
static CVar_t var_merge(CVar_t new, CScope_t scope) {
CVar_t old;
if (cscope_push_var(scope, new, NS_ID))
return new;
else
old = cscope_lookup(scope, new->name, NS_ID)->rec.var;
if (!is_same_type(old->type, new->type))
ERROR((new->ast, "conflicting types of '%s'", new->name));
else if (scope->lvl)
ERROR((new->ast, "redeclaration of '%s' with no linkage", new->name));
type_merge(old->type, new->type);
free(new);
return old;
}
CTable_t semantics_fields(CNode *, CScope_t scope);
CType_t semantics_type_spec(CNode *p, CScope_t scope) {
CHECK_TYPE(p, TYPE_SPEC);
CType_t type;
switch (p->rec.subtype)
{
case KW_VOID:
type = ctype_create("", CVOID, p); break;
case KW_CHAR:
type = ctype_create("", CCHAR, p); break;
case KW_INT:
type = ctype_create("", CINT, p); break;
case KW_STRUCT: case KW_UNION:
{
CNode *id = p->chd,
*fields = p->chd->next;
type = ctype_create(id->type == NOP ? "" : id->rec.strval,
p->rec.subtype == KW_STRUCT ? CSTRUCT : CUNION,
p);
if (fields->type == NOP)
type->rec.fields = NULL; /* incomplete type */
else
type->rec.fields = semantics_fields(fields, scope);
if (id->type != NOP)
type = struct_type_merge(type, scope);
}
break;
default: assert(0);
}
return type;
}
int type_is_complete(CType_t type) {
switch(type->type)
{
case CINT: case CCHAR:
/* basic types are always complete */
case CPTR:
/* pointer may point to an incomplete type */
case CARR:
/* syntax of incomplete arrays is not allowed in `cibic.y` */
return 1;
case CSTRUCT: case CUNION:
/* fields are guaranteed to be complete if exists, due to
* `semantics_fields` */
return type->rec.fields != NULL;
case CVOID:
/* void type is never complete */
return 0;
case CFUNC:
/* function body is not required here, it is checked in the last
* phase */
return 1;
default: assert(0);
}
return 1;
}
CVar_t semantics_declr(CNode *, CType_t, CScope_t, int);
CVar_t semantics_p_decl(CNode *p, CScope_t scope) {
CHECK_TYPE(p, PLAIN_DECL);
CVar_t var = semantics_declr(p->chd->next,
semantics_type_spec(p->chd, scope),
scope, 0);
return var;
}
CVar_t semantics_params(CNode *p, CScope_t scope) {
CHECK_TYPE(p, PARAMS);
p = p->chd;
if (!p) return NULL; /* no parameters */
CVar_t params = semantics_p_decl(p, scope), tail = params;
#ifdef CIBIC_DEBUG
CTable_t tparams = ctable_create(bkdr_hash, ctable_cvar_print);
#else
CTable_t tparams = ctable_create(bkdr_hash);
#endif
FUNC_POINTER_CONV(params->type);
ctable_insert(tparams, params->name, params, 0);
for (p = p->next; p; p = p->next)
{
CVar_t var = semantics_p_decl(p, scope);
FUNC_POINTER_CONV(var->type);
if (scope) /* params inside a function definition */
if (!ctable_insert(tparams, var->name, var, 0))
ERROR((var->ast, "redefinition of parameter '%s'", var->name));
tail->next = var;
tail = var;
}
ctable_destory(tparams);
tail->next = NULL;
return params;
}
ExpType semantics_exp(CNode *, CScope_t);
CVar_t semantics_declr(CNode *p, CType_t type_spec, CScope_t scope, int func_chk) {
CVar_t type;
if (p->type == ID)
{
if (!func_chk) CHECK_CVOID(p->rec.strval, p);
return cvar_create(p->rec.strval, type_spec, p);
}
if (p->type == NOP) /* type name */
return cvar_create(NULL, type_spec, p);
switch (p->rec.subtype)
{
case DECLR_FUNC:
{
CType_t func = ctype_create("", CFUNC, p); /* function declr */
cscope_enter(scope);
func->rec.func.params = semantics_params(p->chd->next, scope);
cscope_exit(scope);
/* incomplete type */
func->rec.func.local = NULL;
func->rec.func.ret = type_spec; /* might be an incomplete type */
func->rec.func.body = NULL; /* not a definition */
type = semantics_declr(p->chd, func, scope, 1);
if (type_spec->type == CARR)
ERROR((p, "'%s' declared as function returning an array", type->name));
if (type_spec->type == CFUNC)
ERROR((p, "'%s' declared as function returing a function", type->name));
}
break;
case DECLR_ARR:
{
CType_t arr = ctype_create("", CARR, p); /* array declr */
CNode *rch = p->chd->next;
ExpType tl = semantics_exp(rch, scope);
if (!type_is_complete(type_spec))
ERROR((p, "array type has incomplete element type"));
if (!rch->ext.is_const)
ERROR((p, "size of array must be a constant"));
if (!IS_INT(tl.type->type))
ERROR((p, "size of array has non-integer type"));
arr->rec.arr.elem = type_spec;
arr->rec.arr.len = rch->ext.const_val;
type = semantics_declr(p->chd, arr, scope, 0);
}
break;
case '*':
{
CType_t ptr = ctype_create("", CPTR, p); /* pointer */
ptr->rec.ref = type_spec;
type = semantics_declr(p->chd, ptr, scope, 0);
}
break;
default: assert(0);
}
return type;
}
CTable_t semantics_fields(CNode *p, CScope_t scope) {
#ifdef CIBIC_DEBUG
CTable_t ct = ctable_create(bkdr_hash, ctable_cvar_print);
#else
CTable_t ct = ctable_create(bkdr_hash);
#endif
for (p = p->chd; p; p = p->next)
{
CNode *declr = p->chd->next->chd;
for (; declr; declr = declr->next)
{
CVar_t var = semantics_declr(declr,
semantics_type_spec(p->chd, scope),
scope, 0);
/* types of fields are supposed to be complete */
if (!type_is_complete(var->type))
ERROR((var->ast, "field '%s' has incomplete type", var->name));
if (var->type->type == CFUNC)
ERROR((var->ast, "field '%s' declared as a function", var->name));
if (!ctable_insert(ct, var->name, var, 0))
ERROR((p, "duplicate member '%s'", var->name));
}
}
return ct;
}
static void exp_check_aseq_(CType_t lhs, CType_t rhs, CNode *ast) {
NOT_IGNORE_VOID(lhs, ast);
NOT_IGNORE_VOID(rhs, ast);
switch (lhs->type)
{
case CSTRUCT: case CUNION:
if (!is_same_type(lhs, rhs))
INCOMP_TYPE(ast);
break;
case CARR: case CFUNC: /* constant */
INCOMP_TYPE(ast);
break;
case CINT: case CCHAR:
switch (rhs->type)
{
case CINT: case CCHAR:
; break; /* ok */
case CPTR: case CARR:
WARNING((ast, "assignment makes integer from pointer without a cast"));
break;
default: INCOMP_TYPE(ast);
}
break;
case CPTR:
switch (rhs->type)
{
case CPTR: case CARR:
if (!is_same_type(lhs->rec.ref, rhs->rec.ref))
WARNING((ast, "assignment from incompatible pointer type"));
break;
case CINT: case CCHAR:
WARNING((ast, "assignment makes pointer from integer without a cast"));
break;
default: INCOMP_TYPE(ast);
}
break;
default: assert(0);
}
}
void semantics_initr(CNode *p, CScope_t scope, CType_t type) {
switch (p->rec.subtype)
{
case INITR_NORM:
{
ExpType et = semantics_exp(p->chd, scope);
if (!scope->lvl && !p->chd->ext.is_const) /* in global scope */
ERROR((p->chd, "initializer element is not constant"));
exp_check_aseq_(type, et.type, p);
}
break;
case INITR_ARR:
{
if (type->type == CARR)
{
/* warning if declr is not an array */
type = type->rec.arr.elem;
}
for (p = p->chd; p; p = p->next)
semantics_initr(p, scope, type);
}
break;
}
}
CVar_t semantics_decl(CNode *p, CScope_t scope) {
CHECK_TYPE(p, DECL);
CNode *declr = p->chd->next;
CType_t type = semantics_type_spec(p->chd, scope);
CVar_t res = NULL;
int useful = 0;
if ((type->type == CSTRUCT || type->type == CUNION) &&
(*type->name) != '\0')
{
cscope_push_type(scope, type, NS_TAG);
useful = 1;
}
if (declr->chd->type != NOP)
{
CNode *p;
for (p = declr->chd; p; p = p->next)
{
CNode *initr = p->chd->next;
CVar_t var = semantics_declr(p->chd, type, scope, 0);
if (var->type->type == CFUNC)
{
CType_t func = var->type;
func->name = var->name;
if (!cscope_push_type(scope, func, NS_ID))
{
CSymbol_t lu = cscope_lookup(scope, func->name, NS_ID);
if (lu->kind != CTYPE)
ERROR((func->ast, "'%s' redeclared as different kind of symbol", func->name));
if (!is_same_type(lu->rec.type, func))
ERROR((func->ast, "conflicting types of '%s'", func->name));
type_merge(lu->rec.type, func);
}
if (initr->type == INITR)
ERROR((var->ast, "function '%s' is initialized like a variable", func->name));
}
else
{
if (scope->lvl && !type_is_complete(var->type))
ERROR((var->ast, "storage size of '%s' isn’t known", var->name));
var = var_merge(var, scope);
var->next = res;
res = var;
/* check initializer */
if (initr->type == INITR)
semantics_initr(initr, scope, var->type);
}
}
useful = 1;
}
if (!useful)
/* useless typename warning */
WARNING((type->ast, "useless declaration"));
return res;
}
ExpType exp_check_aseq(ExpType lhs, ExpType rhs, CNode *ast) {
exp_check_aseq_(lhs.type, rhs.type, ast);
return lhs;
}
ExpType semantics_cast(CNode *p, CScope_t scope) {
CNode *chd = p->chd->next;
ExpType op = semantics_exp(chd, scope);
CVar_t var = semantics_declr(p->chd->chd->next,
semantics_type_spec(p->chd->chd, scope),
scope, 0);
CType_t type = var->type;
free(var);
if (!IS_SCALAR(type->type))
ERROR((p, "conversion to non-scalar type requested"));
if (!IS_SCALAR(op.type->type))
ERROR((p, "aggregate value used where a scalar was expected"));
if (type->type == CARR)
ERROR((p, "cast specifies array type"));
if (type->type == CFUNC)
ERROR((p, "cast specifies function type"));
type->ast = p;
op.type = type;
op.lval = 0;
if ((p->ext.is_const &= !IS_INT(type->type)))
{
p->ext.const_val = chd->ext.const_val;
}
return op;
}
ExpType exp_check_arith(ExpType op1, ExpType op2, CNode *p, char kind) {
CNode *lch = p->chd,
*rch = lch->next;
int t1 = op1.type->type,
t2 = op2.type->type;
ExpType res;
NOT_IGNORE_VOID(op1.type, p);
NOT_IGNORE_VOID(op2.type, p);
res.lval = 0;
res.type = basic_type_int;
if ((p->ext.is_const = lch->ext.is_const && rch->ext.is_const))
{
int l = lch->ext.const_val,
r = rch->ext.const_val,
*a = &(p->ext.const_val);
switch (kind)
{
case '*': *a = l * r; break;
case '/': *a = l / r; break;
case '%': *a = l % r; break;
}
}
if (!(IS_ARITH(t1) && IS_ARITH(t2)))
ERROR((p, "invalid operands to binary operator"));
return res;
}
ExpType exp_check_bitwise(ExpType op1, ExpType op2, CNode *p, char kind) {
CNode *lch = p->chd,
*rch = lch->next;
int t1 = op1.type->type,
t2 = op2.type->type;
ExpType res;
NOT_IGNORE_VOID(op1.type, p);
NOT_IGNORE_VOID(op2.type, p);
res.lval = 0;
res.type = basic_type_int;
if ((p->ext.is_const = lch->ext.is_const && rch->ext.is_const))
{
int l = lch->ext.const_val,
r = rch->ext.const_val,
*a = &(p->ext.const_val);
switch (kind)
{
case 'l': *a = l << r; break;
case 'r': *a = l >> r; break;
case '&': *a = l & r; break;
case '|': *a = l | r; break;
case '^': *a = l ^ r; break;
}
}
if (!(IS_INT(t1) && IS_INT(t2)))
ERROR((p, "invalid operands to binary operator"));
return res;
}
ExpType exp_check_add(ExpType op1, ExpType op2, CNode *p, char kind) {
CNode *lch = p->chd,
*rch = lch->next;
int t1 = op1.type->type,
t2 = op2.type->type;
NOT_IGNORE_VOID(op1.type, p);
NOT_IGNORE_VOID(op2.type, p);
if (kind == '+' && IS_PTR(t2))
{
/* place the pointer type in the first place */
int t = t1;
ExpType te = op1;
t1 = t2;
t2 = t;
op1 = op2;
op2 = te;
CNode *n1 = p->chd;
CNode *n2 = n1->next;
n2->next = n1;
n1->next = NULL;
p->chd = n2;
}
if (kind == '-')
{
if (IS_PTR(t2) && !IS_PTR(t1))
ERROR((p, "invalid operands to binary operator"));
}
else
{
if (!((IS_INT(t1) || IS_PTR(t1)) && IS_INT(t2)))
ERROR((p, "invalid operands to binary operator"));
}
if ((p->ext.is_const = lch->ext.is_const && rch->ext.is_const))
{
int l = lch->ext.const_val,
r = rch->ext.const_val,
*a = &(p->ext.const_val);
if (!IS_PTR(t1) && !IS_PTR(t2))
switch (kind)
{
case '+': *a = l + r; break;
case '-': *a = l - r; break;
}
else
{
/* TODO: constant pointer folding */
}
}
op1.lval = 0;
return op1; /* int or pointer */
}
ExpType exp_check_int(ExpType op1, CNode *p) {
if (!IS_INT(op1.type->type))
ERROR((p, "wrong type argument to unary operator"));
op1.lval = 0;
return op1;
}
ExpType exp_check_scalar(ExpType op1, CNode *p) {
if (!IS_SCALAR(op1.type->type))
ERROR((p, "wrong type argument to unary operator"));
op1.lval = 0;
return op1;
}
ExpType exp_check_deref(ExpType op1, CNode *p) {
if (!IS_PTR(op1.type->type))
ERROR((p, "invalid type argument of unary '*'"));
if (op1.type->rec.ref->type == CFUNC)
return op1;
op1.lval = 1; /* deref changes exp to lval */
if (!type_is_complete(op1.type = op1.type->rec.ref))
ERROR((p, "dereferencing pointer to incomplete type"));
return op1;
}
ExpType exp_check_ref(ExpType op1, CNode *p) {
ExpType res;
CType_t t = op1.type;
if (t->type == CARR || (t->type == CPTR && t->rec.ref->type == CFUNC))
return op1;
if (!op1.lval)
ERROR((p, "lvalue required as unary '&' operand"));
/* TODO: constant pointer folding */
p->ext.is_const = 0;
/* should be constant */
res.lval = 0;
res.type = ctype_create("", CPTR, p);
res.type->rec.ref = op1.type;
return res;
}
ExpType exp_check_sizeof(CNode *p, CScope_t scope) {
if (p->chd->type == EXP)
semantics_exp(p->chd, scope);
ExpType res;
res.lval = 0;
res.type = basic_type_int;
return res;
}
ExpType exp_check_inc(ExpType op1, CNode *p) {
if (!IS_SCALAR(op1.type->type))
ERROR((p, "wrong type argument to increment/decrement"));
if (!op1.lval)
ERROR((p, "lvalue required as increment/decrement operand"));
return op1;
}
ExpType exp_check_logical(ExpType op1, ExpType op2, CNode *p, char kind) {
CNode *lch = p->chd,
*rch = lch->next;
int t1 = op1.type->type,
t2 = op2.type->type;
ExpType res;
NOT_IGNORE_VOID(op1.type, p);
NOT_IGNORE_VOID(op2.type, p);
res.lval = 0;
res.type = basic_type_int;
if ((p->ext.is_const = lch->ext.is_const && rch->ext.is_const))
{
int l = lch->ext.const_val,
r = rch->ext.const_val,
*a = &(p->ext.const_val);
switch (kind)
{
case '&': *a = l && r; break;
case '|': *a = l || r; break;
}
}
if (!(IS_SCALAR(t1) && IS_SCALAR(t2)))
ERROR((p, "invalid operands to binary operator"));
return res;
}
ExpType exp_check_ass(ExpType lhs, ExpType rhs, CNode *p) {
NOT_IGNORE_VOID(lhs.type, p);
NOT_IGNORE_VOID(rhs.type, p);
if (!lhs.lval)
ERROR((p, "lvalue required as left operand of assignment"));
switch (p->rec.subtype)
{
case '=' : return exp_check_aseq(lhs, rhs, p);
case ASS_MUL: return exp_check_aseq(lhs, exp_check_arith(lhs, rhs, p, '*'), p);
case ASS_DIV: return exp_check_aseq(lhs, exp_check_arith(lhs, rhs, p, '/'), p);
case ASS_MOD: return exp_check_aseq(lhs, exp_check_arith(lhs, rhs, p, '%'), p);
case ASS_ADD: return exp_check_aseq(lhs, exp_check_add(lhs, rhs, p, '+'), p);
case ASS_SUB: return exp_check_aseq(lhs, exp_check_add(lhs, rhs, p, '-'), p);
case ASS_SHL: return exp_check_aseq(lhs, exp_check_bitwise(lhs, rhs, p, 'l'), p);
case ASS_SHR: return exp_check_aseq(lhs, exp_check_bitwise(lhs, rhs, p, 'r'), p);
case ASS_AND: return exp_check_aseq(lhs, exp_check_bitwise(lhs, rhs, p, '&'), p);
case ASS_XOR: return exp_check_aseq(lhs, exp_check_bitwise(lhs, rhs, p, '^'), p);
case ASS_OR: return exp_check_aseq(lhs, exp_check_bitwise(lhs, rhs, p, '|'), p);
default: assert(0);
}
}
ExpType exp_check_equality(ExpType op1, ExpType op2, CNode *p, int kind) {
CNode *lch = p->chd,
*rch = lch->next;
int t1 = op1.type->type,
t2 = op2.type->type;
ExpType res;
NOT_IGNORE_VOID(op1.type, p);
NOT_IGNORE_VOID(op2.type, p);
res.lval = 0;
res.type = basic_type_int;
if ((p->ext.is_const = lch->ext.is_const && rch->ext.is_const))
{
int l = lch->ext.const_val,
r = rch->ext.const_val,
*a = &(p->ext.const_val);
switch (kind)
{
case OPT_EQ: *a = l == r; break;
case OPT_NE: *a = l != r; break;
case '>': *a = l > r; break;
case '<': *a = l < r; break;
case OPT_LE: *a = l <= r; break;
case OPT_GE: *a = l >= r; break;
}
}
if (IS_ARITH(t1) && IS_ARITH(t2))
return res;
if (!(IS_SCALAR(t1) && IS_SCALAR(t2)))
ERROR((p, "invalid operands to binary operator"));
if (IS_PTR(t1) && IS_PTR(t2))
{
if (!is_same_type(op1.type->rec.ref, op2.type->rec.ref))
WARNING((p, "comparison of distinct pointer types lacks a cast"));
}
else if (IS_PTR(t1) || IS_PTR(t2))
WARNING((p, "comparison between pointer and integer"));
return res;
}
ExpType exp_check_postfix(CNode *p, CScope_t scope) {
CNode *post = p->chd->next;
ExpType op1 = semantics_exp(p->chd, scope), op2;
int t1 = op1.type->type, t2;
switch (post->rec.subtype)
{
case POSTFIX_ARR:
if (!IS_PTR(t1))
ERROR((p, "subscripted value is neither array nor pointer"));
op2 = semantics_exp(post->chd, scope);
t2 = op2.type->type;
if (!IS_INT(t2))
ERROR((p, "array subscript is not an integer"));
op1.type = op1.type->rec.arr.elem;
op1.lval = 1;
break;
case POSTFIX_CALL:
if (!(t1 == CPTR && op1.type->rec.ref->type == CFUNC))
ERROR((p, "called object is not a function"));
{
CNode *arg = post->chd->chd;
CType_t func = p->chd->ext.type;
CVar_t param;
/* pointer to function */
if (func->type == CPTR) func = func->rec.ref;
if ((param = func->rec.func.params))
{
for (; arg && param;
arg = arg->next, param = param->next)
{
semantics_exp(arg, scope);
exp_check_aseq_(param->type, arg->ext.type, arg);
}
if (arg || param)
ERROR((p, "too many/few arguments to the function"));
}
op1.type = func->rec.func.ret;
op1.lval = 0;
break;
}
case POSTFIX_DOT:
if (!(t1 == CSTRUCT || t1 == CUNION))
ERROR((p, "request for the member in something not a structure or union"));
{
CVar_t fv = ctable_lookup(op1.type->rec.fields, post->chd->rec.strval);
if (!fv)
ERROR((p, "struct/union has no member named '%s'", post->chd->rec.strval));
p->ext.var = fv;
op1.type = fv->type;
op1.lval = 1;
}
break;
case POSTFIX_PTR:
if (t1 != CPTR)
ERROR((p, "invalid type argument of '->'"));
{
CType_t tref = op1.type->rec.ref;
if (!(tref->type == CSTRUCT || tref->type == CUNION))
ERROR((p, "request for the member in something not a structure or union"));
if (!tref->rec.fields)
ERROR((p, "dereferencing pointer to incomplete type"));
CVar_t fv = ctable_lookup(tref->rec.fields, post->chd->rec.strval);
if (!fv)
ERROR((p, "struct/union has no member named '%s'", post->chd->rec.strval));
p->ext.var = fv;
op1.type = fv->type;
op1.lval = 1;
}
break;
case OPT_INC: case OPT_DEC:
exp_check_inc(op1, p);
break;
default: assert(0);
}
return op1;
}
ExpType semantics_exp(CNode *p, CScope_t scope) {
ExpType res;
switch (p->type)
{
case ID:
{
CSymbol_t lu = cscope_lookup(scope, p->rec.strval, NS_ID);
if (!lu) ERROR((p, "'%s' undeclared", p->rec.strval));
if (lu->kind == CVAR)
{
p->ext.var = lu->rec.var;
res.type = p->ext.var->type;
res.lval = res.type->type != CARR;
}
else
{
p->ext.type = lu->rec.type;
res.type = p->ext.type;
res.lval = res.type->type == CFUNC;
FUNC_POINTER_CONV(res.type);
}
p->ext.is_const = 0;
}
break;
case INT:
res.type = basic_type_int;
res.lval = 0;
p->ext.is_const = 1;
p->ext.const_val = p->rec.intval;
break;
case CHAR:
res.type = basic_type_char;
res.lval = 0;
p->ext.is_const = 1;
p->ext.const_val = p->rec.intval;
break;
case STR:
{
CType_t type = ctype_create("", CPTR, NULL);
type->rec.ref = basic_type_char;
res.type = type;
res.lval = 0;
p->ext.is_const = 1;
p->ext.const_val = (long int)p->rec.strval;
}
break;
case EXP:
{
ExpType op1;
ExpType op2;
switch (p->rec.subtype)
{
case EXP_CAST:
res = semantics_cast(p, scope);
break;
case EXP_POSTFIX:
res = exp_check_postfix(p, scope);
break;
case KW_SIZEOF:
res = exp_check_sizeof(p, scope);
break;
default:
{
op1 = semantics_exp(p->chd, scope);
if (p->chd->next)
op2 = semantics_exp(p->chd->next, scope);
switch (p->rec.subtype)
{
/* following cases are binary expressions */
case ',':
res = op2;
res.lval = 0;
break;
case '=' :
case ASS_MUL:
case ASS_DIV:
case ASS_MOD:
case ASS_ADD:
case ASS_SUB:
case ASS_SHL:
case ASS_SHR:
case ASS_AND:
case ASS_XOR:
case ASS_OR:
res = exp_check_ass(op1, op2, p);
break;
case OPT_OR:
res = exp_check_logical(op1, op2, p, '|');
break;
case OPT_AND:
res = exp_check_logical(op1, op2, p, '&');
break;
case OPT_SHL:
case OPT_SHR:
case '|':
case '^':
res = exp_check_bitwise(op1, op2, p, p->rec.subtype);
break;
case OPT_EQ:
case OPT_NE:
case '<':
case '>' :
case OPT_LE:
case OPT_GE:
res = exp_check_equality(op1, op2, p, p->rec.subtype);
break;
case '/':
case '%':
res = exp_check_arith(op1, op2, p, p->rec.subtype);
break;
case '&':
if (p->chd->next)
res = exp_check_bitwise(op1, op2, p, '&');
else
res = exp_check_ref(op1, p);
break;
case '*':
if (p->chd->next)
res = exp_check_arith(op1, op2, p, '*');
else
res = exp_check_deref(op1, p);
break;
case '+':
if (p->chd->next)
res = exp_check_add(op1, op2, p, '+');
else
{
res = op1;
res.lval = 0;
}
break;
case '-':
if (p->chd->next)
res = exp_check_add(op1, op2, p, '-');
else
{
res = op1;
res.lval = 0;
}
break;
case '~':
res = exp_check_int(op1, p);
break;
case '!':
res = exp_check_scalar(op1, p);
break;
case OPT_INC: case OPT_DEC:
res = exp_check_inc(op1, p);
break;
default:
printf("%d\n", p->rec.subtype);
assert(0);
}
}
}
}
break;
case NOP: ; break;
default: assert(0);
}
p->ext.type = res.type;
return res;
}
CVar_t semantics_stmt(CNode *p, CScope_t scope);
CVar_t semantics_if(CNode *p, CScope_t scope) {
ExpType exp = semantics_exp(p->chd, scope);
CNode *body1 = p->chd->next,
*body2 = body1->next;
CVar_t res;
if (!IS_SCALAR(exp.type->type))
ERROR((p->chd, "a scalar is required in 'if' condition"));
cscope_enter(scope);
res = semantics_stmt(body1, scope);
cscope_exit(scope);
if (body2->type != NOP)
{
CVar_t t;
cscope_enter(scope);
if ((t = semantics_stmt(p->chd->next->next, scope)))
{
t->next = res;
res = t;
}
cscope_exit(scope);
}
return res;
}
CVar_t semantics_for(CNode *p, CScope_t scope) {
ExpType exp = semantics_exp(p->chd->next, scope);
semantics_exp(p->chd, scope);
semantics_exp(p->chd->next->next, scope);
CVar_t res;
if (p->chd->next->type != NOP && !IS_SCALAR(exp.type->type))
ERROR((p->chd->next, "a scalar is required in 'for' condition"));
cscope_enter(scope);
scope->inside_loop++;
res = semantics_stmt(p->chd->next->next->next, scope);
scope->inside_loop--;
cscope_exit(scope);
return res;
}
CVar_t semantics_while(CNode *p, CScope_t scope) {
ExpType exp = semantics_exp(p->chd, scope);
CVar_t res;
if (!IS_SCALAR(exp.type->type))
ERROR((p->chd, "a scalar is required in 'while' condition"));
cscope_enter(scope);
scope->inside_loop++;
res = semantics_stmt(p->chd->next, scope);
scope->inside_loop--;
cscope_exit(scope);
return res;
}
CVar_t semantics_check_loop(CNode *p, CScope_t scope, const char *stmt_name) {
if (!scope->inside_loop)
ERROR((p, "%s statement not within a loop", stmt_name));
return NULL;
}
CVar_t semantics_return(CNode *p, CScope_t scope) {
assert(scope->func);
CType_t rt = scope->func->rec.func.ret;
if (p->chd->type != NOP)
{
ExpType t = semantics_exp(p->chd, scope);
if (rt->type == CVOID)
{
if (t.type->type != CVOID)
WARNING((p->chd, "'return' with a value, in function returning void"));
}
else
exp_check_aseq_(rt, p->chd->ext.type, p->chd);
}
return NULL;
}
CVar_t semantics_comp(CNode *, CScope_t);
CVar_t semantics_stmt(CNode *p, CScope_t scope) {
CHECK_TYPE(p, STMT);
switch (p->rec.subtype)
{
case STMT_EXP:
semantics_exp(p->chd, scope);
break;
case STMT_COMP:
{
CVar_t res;
cscope_enter(scope);
res = semantics_comp(p, scope);
cscope_exit(scope);
return res;
}
case STMT_IF:
return semantics_if(p, scope);
case STMT_FOR:
return semantics_for(p, scope);
case STMT_WHILE:
return semantics_while(p, scope);
case STMT_CONT:
return semantics_check_loop(p, scope, "continue");
case STMT_BREAK:
return semantics_check_loop(p, scope, "break");
case STMT_RET:
return semantics_return(p, scope);
default: assert(0);
}
return NULL;
}
CVar_t semantics_comp(CNode *p, CScope_t scope) {
CNode *decls = p->chd,
*stmts = p->chd->next, *i;
CVar_t res = NULL;
if (decls->chd->type != NOP)
for (i = decls->chd; i; i = i->next)
{
CVar_t vlist = semantics_decl(i, scope);
if (vlist) /* collect local vars */
{
CVar_t p;
for (p = vlist; p->next; p = p->next);
p->next = res;
res = vlist;
}
}
if (stmts->chd->type != NOP)
for (i = stmts->chd; i; i = i->next)
{
CVar_t vlist = semantics_stmt(i, scope);
if (vlist) /* collect nested local vars */
{
CVar_t p;
for (p = vlist; p->next; p = p->next);
p->next = res;
res = vlist;
}
}
return res;
}
CType_t semantics_func(CNode *p, CScope_t scope) {
CHECK_TYPE(p, FUNC_DEF);
CVar_t head = semantics_declr(p->chd->next,
semantics_type_spec(p->chd, scope),
scope, 0);
CType_t func = head->type, efunc;
CType_t rt = func->rec.func.ret;
if (rt->type != CVOID && !type_is_complete(rt))
ERROR((func->rec.func.ret->ast, "return type is an incomplete type"));
scope->func = func;
func->rec.func.body = p->chd->next->next;
func->name = head->name;
free(head);
cscope_enter(scope); /* enter function local scope */
{ /* Note: here is a dirty hack to forcibly push function definition to
the global scope, while all the types specified in parameters retain in local scope.
The key point is to make sure semantics_params does not push any var */
CSNode *ntop = scope->top;
CVar_t var;
scope->top = ntop->next;
scope->lvl--;
if (!cscope_push_type(scope, func, NS_ID))
{
CSymbol_t lu = cscope_lookup(scope, func->name, NS_ID);
if (lu->kind != CTYPE)
ERROR((func->ast, "'%s' redeclared as different kind of symbol", func->name));
efunc = lu->rec.type;
if (efunc->type != CFUNC)
ERROR((func->ast, "conflicting types of '%s'", func->name));
else if (efunc->rec.func.body)
ERROR((func->ast, "redefintion of function '%s'", func->name));
else if (!is_same_type(efunc, func))
ERROR((func->ast, "function defintion does not match the prototype"));
type_merge(efunc, func);
free(func);
}
scope->top = ntop;
scope->lvl++;
for (var = func->rec.func.params; var; var = var->next)
{
cscope_push_var(scope, var, NS_ID);
if (!type_is_complete(var->type))
ERROR((var->ast, "parameter '%s' has incomplete type", var->name));
}
}
func->rec.func.local = semantics_comp(p->chd->next->next, scope); /* check comp */
cscope_exit(scope); /* exit from local scope */
return func;
}
CType_t make_builtin_func(const char *name, CType_t rt) {
CType_t func = ctype_create(name, CFUNC, NULL);
func->rec.func.params = NULL;
func->rec.func.body = NULL;
func->rec.func.local = NULL;
func->rec.func.ret = rt;
return func;
}
void semantics_check(CNode *p) {
CScope_t scope = cscope_create();
basic_type_int = ctype_create("int", CINT, NULL);
basic_type_char = ctype_create("char", CCHAR, NULL);
basic_type_void = ctype_create("void", CVOID, NULL);
builtin_printf = make_builtin_func("printf", basic_type_int);
builtin_scanf = make_builtin_func("scanf", basic_type_int);
{
CType_t vstar = ctype_create("", CPTR, NULL);
vstar->rec.ref = basic_type_void;
builtin_malloc = make_builtin_func("malloc", vstar);
}
/* add top-level basic types */
cscope_push_type(scope, basic_type_int, NS_TAG);
cscope_push_type(scope, basic_type_char, NS_TAG);
cscope_push_type(scope, basic_type_void, NS_TAG);
cscope_push_type(scope, builtin_printf, NS_ID);
cscope_push_type(scope, builtin_scanf, NS_ID);
cscope_push_type(scope, builtin_malloc, NS_ID);
/* check all definitions and declarations */
for (p = p->chd; p; p = p->next)
{
switch (p->type)
{
case FUNC_DEF:
semantics_func(p, scope); break;
case DECL:
semantics_decl(p, scope); break;
default: assert(0);
}
}
cscope_debug_print(scope);
{
CTNode *p;
int i;
for (i = 0; i < MAX_TABLE_SIZE; i++)
for (p = scope->ids->head[i]; p; p = p->next)
{
CSymbol_t tp = (CSymbol_t)(p->val);
if (tp->kind == CVAR)
cvar_print(tp->rec.var);
else
ctype_print(tp->rec.type);
fprintf(stderr, "\n");
}
for (i = 0; i < MAX_TABLE_SIZE; i++)
for (p = scope->tags->head[i]; p; p = p->next)
{
CSymbol_t tp = (CSymbol_t)(p->val);
if (tp->kind == CVAR)
cvar_print(tp->rec.var);
else
ctype_print(tp->rec.type);
fprintf(stderr, "\n");
}
}
cnode_debug_print(ast_root, 1);
}