/* gmqcc/parser.c */

2012-07-16 12:52:52 +00:00
#include <stdio.h>
#include <stdarg.h>
2012-07-16 11:59:10 +00:00
#include "gmqcc.h"
#include "lexer.h"
2012-07-16 12:14:37 +00:00
typedef struct {
lex_file *lex;
int tok;
2012-07-16 12:52:52 +00:00
MEM_VECTOR_MAKE(ast_value*, globals);
MEM_VECTOR_MAKE(ast_function*, functions);
MEM_VECTOR_MAKE(ast_value*, imm_float);
ast_function *function;
MEM_VECTOR_MAKE(ast_value*, locals);
size_t blocklocal;
2012-07-16 12:14:37 +00:00
} parser_t;
2012-07-16 12:52:52 +00:00
/* Instantiate the vector helpers for each parser_t vector member; this file
 * uses the generated parser_t_<member>_add functions.
 */
MEM_VEC_FUNCTIONS(parser_t, ast_value*, globals)
MEM_VEC_FUNCTIONS(parser_t, ast_value*, imm_float)
MEM_VEC_FUNCTIONS(parser_t, ast_value*, locals)
MEM_VEC_FUNCTIONS(parser_t, ast_function*, functions)
2012-07-16 12:52:52 +00:00
/*
 * Print a printf-style error message to stdout, followed by a newline.
 *
 * When `parser` is non-NULL the message is prefixed with the file name and
 * line number stored in the context of the lexer's current token; otherwise a
 * plain "error: " prefix is used.
 */
void parseerror(parser_t *parser, const char *fmt, ...)
{
    va_list args;

    if (!parser) {
        fputs("error: ", stdout);
    } else {
        printf("error %s:%lu: ",
               parser->lex->tok->ctx.file,
               (unsigned long)parser->lex->tok->ctx.line);
    }

    va_start(args, fmt);
    vprintf(fmt, args);
    va_end(args);

    putchar('\n');
}
/*
 * Advance to the next token and store its id in parser->tok.
 *
 * Returns true for an ordinary token, false when the new token is TOKEN_EOF
 * or any id at or above TOKEN_ERROR.
 */
bool parser_next(parser_t *parser)
{
    /* lex_do kills the previous token */
    parser->tok = lex_do(parser->lex);

    return parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR;
}
/*
 * Detach the lexer's current token and hand it to the caller, so that the
 * next call to parser_next does not destroy it. The lexer's token pointer is
 * reset to NULL.
 */
token *parser_lift(parser_t *parser)
{
    token *lifted = parser->lex->tok;

    parser->lex->tok = NULL;
    return lifted;
}
/*
 * Accessors for the lexer's current token, given a parser pointer:
 *   parser_tokval - the token's value
 *   parser_token  - the token itself
 *   parser_ctx    - the token's context (file/line)
 *
 * The argument is parenthesized so that any pointer-valued expression
 * (e.g. `base + 1`) expands correctly.
 */
#define parser_tokval(p) ((p)->lex->tok->value)
#define parser_token(p)  ((p)->lex->tok)
#define parser_ctx(p)    ((p)->lex->tok->ctx)
/*
 * Return the float immediate holding the value `d`.
 *
 * An existing entry of parser->imm_float whose value compares equal to `d` is
 * reused; otherwise a new constant named "#IMMEDIATE" is created and appended
 * to parser->imm_float.
 *
 * Returns NULL if the value cannot be allocated or cannot be stored.
 */
ast_value* parser_const_float(parser_t *parser, double d)
{
    size_t i;
    ast_value *out;

    for (i = 0; i < parser->imm_float_count; ++i) {
        if (parser->imm_float[i]->constval.vfloat == d)
            return parser->imm_float[i];
    }

    out = ast_value_new(parser_ctx(parser), "#IMMEDIATE", TYPE_FLOAT);
    if (!out)
        return NULL; /* allocation failed: do not dereference */

    out->isconst = true;
    out->constval.vfloat = d;

    if (!parser_t_imm_float_add(parser, out)) {
        ast_value_delete(out);
        return NULL;
    }
    return out;
}
2012-07-16 12:52:52 +00:00
/*
 * Look up a global by name.
 *
 * Scans parser->globals from the first entry onwards and returns the first
 * value whose name equals `name`, or NULL when there is none.
 */
ast_value* parser_find_global(parser_t *parser, const char *name)
{
    size_t idx = 0;

    while (idx < parser->globals_count) {
        ast_value *candidate = parser->globals[idx];
        if (strcmp(candidate->name, name) == 0)
            return candidate;
        ++idx;
    }
    return NULL;
}
/*
 * Look up a local by name, newest declaration first.
 *
 * Only entries of parser->locals with an index >= `upto` are considered; the
 * scan runs from the last entry down to index `upto`. Returns the first match
 * or NULL.
 */
ast_value* parser_find_local(parser_t *parser, const char *name, size_t upto)
{
    size_t idx = parser->locals_count;

    while (idx > upto) {
        ast_value *candidate = parser->locals[--idx];
        if (strcmp(candidate->name, name) == 0)
            return candidate;
    }
    return NULL;
}
/*
 * Resolve a variable name: all locals are searched first, then the globals.
 * Returns NULL when the name is unknown.
 */
ast_value* parser_find_var(parser_t *parser, const char *name)
{
    ast_value *found = parser_find_local(parser, name, 0);

    if (found)
        return found;
    return parser_find_global(parser, name);
}
/* Temporary list of parameter values collected by parser_parse_type while it
 * reads a parenthesized parameter list.
 */
typedef struct {
MEM_VECTOR_MAKE(ast_value*, p);
} paramlist_t;
/* Generates the vector helpers for member `p` (parser_parse_type uses paramlist_t_p_add). */
MEM_VEC_FUNCTIONS(paramlist_t, ast_value*, p)
/*
 * Parse the part of a type that follows the base type name.
 *
 * If the current token is '(' a parameter list is read: each parameter is a
 * type name followed by a (recursively parsed) type, separated by ','. In that
 * case *isfunc is set to true and the parsed parameters are moved into the
 * returned value's `params` vector. Otherwise *isfunc is set to false.
 *
 * Returns a new value named "<unnamed>" of type `basetype`, or NULL on error.
 * On error every parameter parsed so far is deleted; clearing the vector alone
 * would only release the array and leak the values.
 */
static ast_value *parser_parse_type(parser_t *parser, int basetype, bool *isfunc)
{
    paramlist_t params;
    ast_value *var;
    lex_ctx ctx = parser_ctx(parser);
    int vtype = basetype;
    int temptype;
    size_t i;

    MEM_VECTOR_INIT(&params, p);

    *isfunc = false;

    if (parser->tok == '(') {
        *isfunc = true;
        while (true) {
            ast_value *param;
            bool dummy;

            if (!parser_next(parser))
                goto on_error;

            if (parser->tok == ')')
                break;

            /* constval.t is only meaningful for type name tokens */
            if (parser->tok != TOKEN_TYPENAME) {
                parseerror(parser, "expected parameter type");
                goto on_error;
            }
            temptype = parser_token(parser)->constval.t;
            if (!parser_next(parser))
                goto on_error;

            param = parser_parse_type(parser, temptype, &dummy);
            (void)dummy;

            if (!param)
                goto on_error;

            if (!paramlist_t_p_add(&params, param)) {
                /* not stored in the list, so it must be released here */
                ast_value_delete(param);
                parseerror(parser, "Out of memory while parsing typename");
                goto on_error;
            }

            if (parser->tok == ',')
                continue;
            if (parser->tok == ')')
                break;
            parseerror(parser, "Unexpected token");
            goto on_error;
        }
        /* skip the closing ')' */
        if (!parser_next(parser))
            goto on_error;
    }

    var = ast_value_new(ctx, "<unnamed>", vtype);
    if (!var)
        goto on_error;

    /* hand the collected parameters over to the new value */
    MEM_VECTOR_MOVE(&params, p, var, params);
    return var;

on_error:
    for (i = 0; i < params.p_count; ++i)
        ast_value_delete(params.p[i]);
    MEM_VECTOR_CLEAR(&params, p);
    return NULL;
}
2012-07-20 12:04:52 +00:00
typedef struct
{
2012-07-20 13:02:18 +00:00
size_t etype; /* 0 = expression, others are operators */
2012-07-20 12:04:52 +00:00
ast_expression* out;
} sy_elem;
/* Working state of the expression parser: `out` collects operands and `ops`
 * holds the operators that are still pending.
 */
typedef struct
{
MEM_VECTOR_MAKE(sy_elem, out);
MEM_VECTOR_MAKE(sy_elem, ops);
} shynt;
/* Generates the vector helpers for both members (shynt_out_add and shynt_ops_add are used in this file). */
MEM_VEC_FUNCTIONS(shynt, sy_elem, out)
MEM_VEC_FUNCTIONS(shynt, sy_elem, ops)
/* Wrap an expression in a stack element (etype 0 marks an expression). */
static sy_elem syexp(ast_expression *v) {
    sy_elem elem;

    elem.out   = v;
    elem.etype = 0;
    return elem;
}

/* Same as syexp, for a value (cast to its expression base). */
static sy_elem syval(ast_value *v) {
    return syexp((ast_expression*)v);
}
2012-07-20 12:04:52 +00:00
2012-07-20 13:02:18 +00:00
/*
 * Wrap an operator in a stack element. `op` must point into the `operators`
 * table: the element stores its index plus one, so that 0 stays reserved for
 * expressions.
 */
static sy_elem syop(const oper_info *op) {
    sy_elem elem;

    elem.out   = NULL;
    elem.etype = 1 + (op - operators);
    return elem;
}
/*
 * Pop the topmost pending operator and apply it to the operand stack.
 *
 * Operator application is not implemented yet. The callers loop until
 * sy->ops_count reaches zero, so reporting success without removing an
 * operator would make them spin forever; fail with an error message instead.
 */
static bool parser_sy_pop(parser_t *parser, shynt *sy)
{
    (void)sy;
    parseerror(parser, "TODO: operators in expressions");
    return false;
}
2012-07-20 12:45:23 +00:00
/*
 * Parse an expression starting at the current token.
 *
 * Operands (identifiers, float and integer constants) and operators are
 * expected alternately. Operands are pushed onto sy.out; operators onto
 * sy.ops after operators that bind at least as tightly have been popped
 * (precedence / left associativity). Parsing stops at the first operator
 * token that is not a known non-prefix, non-suffix operator.
 *
 * The lexer's `noops` flag is cleared while an operator is expected and set
 * again otherwise; it is always left set on return.
 *
 * Returns the first entry of the output stack, or NULL on error. Every error
 * path goes through `onerr` so the two stacks are released.
 */
static ast_expression* parser_expression(parser_t *parser)
{
    ast_expression *expr = NULL;
    shynt sy;
    bool wantop = false;

    MEM_VECTOR_INIT(&sy, out);
    MEM_VECTOR_INIT(&sy, ops);

    while (true)
    {
        if (!wantop)
        {
            if (parser->tok == TOKEN_IDENT)
            {
                /* variable */
                ast_value *var = parser_find_var(parser, parser_tokval(parser));
                if (!var) {
                    parseerror(parser, "unexpected ident: %s", parser_tokval(parser));
                    goto onerr;
                }
                if (!shynt_out_add(&sy, syval(var))) {
                    parseerror(parser, "out of memory");
                    goto onerr;
                }
            } else if (parser->tok == TOKEN_FLOATCONST) {
                ast_value *val = parser_const_float(parser, (parser_token(parser)->constval.f));
                if (!val)
                    goto onerr;
                if (!shynt_out_add(&sy, syval(val))) {
                    parseerror(parser, "out of memory");
                    goto onerr;
                }
            } else if (parser->tok == TOKEN_INTCONST) {
                /* integer constants are stored as float immediates */
                ast_value *val = parser_const_float(parser, (double)(parser_token(parser)->constval.i));
                if (!val)
                    goto onerr;
                if (!shynt_out_add(&sy, syval(val))) {
                    parseerror(parser, "out of memory");
                    goto onerr;
                }
            } else {
                /* TODO: prefix operators */
                parseerror(parser, "expected statement");
                goto onerr;
            }
            wantop = true;
            parser->lex->flags.noops = false;
            if (!parser_next(parser)) {
                goto onerr;
            }
        } else {
            if (parser->tok != TOKEN_OPERATOR) {
                parseerror(parser, "expected operator or end of statement");
                goto onerr;
            } else {
                /* classify the operator */
                /* TODO: suffix operators */
                const oper_info *op;
                const oper_info *olast = NULL;
                size_t o;
                for (o = 0; o < operator_count; ++o) {
                    if (!(operators[o].flags & OP_PREFIX) &&
                        !(operators[o].flags & OP_SUFFIX) && /* remove this */
                        !strcmp(parser_tokval(parser), operators[o].op))
                    {
                        break;
                    }
                }
                if (o == operator_count) {
                    /* no operator found... must be the end of the statement */
                    break;
                }
                /* found an operator */
                op = &operators[o];

                /* etype of an operator entry is its table index plus one */
                if (sy.ops_count)
                    olast = &operators[sy.ops[sy.ops_count-1].etype-1];

                while (olast && (
                        (op->prec < olast->prec) ||
                        (op->assoc == ASSOC_LEFT && op->prec <= olast->prec) ) )
                {
                    if (!parser_sy_pop(parser, &sy))
                        goto onerr;
                    olast = sy.ops_count ? (&operators[sy.ops[sy.ops_count-1].etype-1]) : NULL;
                }

                if (!shynt_ops_add(&sy, syop(op)))
                    goto onerr;
            }
            wantop = false;
            parser->lex->flags.noops = true;
            if (!parser_next(parser)) {
                goto onerr;
            }
        }
    }

    /* apply whatever operators are still pending */
    while (sy.ops_count) {
        if (!parser_sy_pop(parser, &sy))
            goto onerr;
    }

    parser->lex->flags.noops = true;
    if (!sy.out_count) {
        parseerror(parser, "empty expression");
        expr = NULL;
    } else
        expr = sy.out[0].out;
    MEM_VECTOR_CLEAR(&sy, out);
    MEM_VECTOR_CLEAR(&sy, ops);
    return expr;

onerr:
    parser->lex->flags.noops = true;
    MEM_VECTOR_CLEAR(&sy, out);
    MEM_VECTOR_CLEAR(&sy, ops);
    return NULL;
}
2012-07-20 10:46:59 +00:00
static bool parser_variable(parser_t *parser, bool global);

/*
 * Parse one element of a function body and, for expressions, append it to
 * `block`:
 *   - a type name starts a local variable declaration,
 *   - '{' (an inner block) is not supported yet and is reported as an error,
 *   - anything else is parsed as an expression.
 *
 * Returns false on any error.
 */
static bool parser_body_do(parser_t *parser, ast_block *block)
{
    ast_expression *exp;

    if (parser->tok == TOKEN_TYPENAME) {
        /* local variable */
        return parser_variable(parser, false);
    }

    if (parser->tok == '{') {
        /* a block */
        parseerror(parser, "TODO: inner blocks");
        return false;
    }

    exp = parser_expression(parser);
    if (!exp)
        return false;
    if (!ast_block_exprs_add(block, exp))
        return false;
    return true;
}
2012-07-20 10:46:59 +00:00
/*
 * Parse a '{' ... '}' block; the current token must be the opening '{'.
 *
 * While the block is parsed parser->blocklocal is set to the number of locals
 * that existed on entry, and it is restored before returning. The closing '}'
 * is consumed on success.
 *
 * Returns the new block, or NULL if allocation fails, an element fails to
 * parse, or the closing '}' is missing.
 */
static ast_block* parser_parse_block(parser_t *parser)
{
    size_t oldblocklocal;
    ast_block *block = NULL;

    oldblocklocal = parser->blocklocal;
    parser->blocklocal = parser->locals_count;

    if (!parser_next(parser)) { /* skip the '{' */
        parseerror(parser, "expected function body");
        goto cleanup;
    }

    block = ast_block_new(parser_ctx(parser));
    if (!block) {
        /* never hand a NULL block to parser_body_do */
        parseerror(parser, "out of memory");
        goto cleanup;
    }

    while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
    {
        if (parser->tok == '}')
            break;

        if (!parser_body_do(parser, block)) {
            ast_block_delete(block);
            block = NULL;
            goto cleanup;
        }
    }

    if (parser->tok != '}') {
        ast_block_delete(block);
        block = NULL;
    } else {
        (void)parser_next(parser);
    }

cleanup:
    parser->blocklocal = oldblocklocal;
    return block;
}
2012-07-20 10:46:59 +00:00
/*
 * Parse a declaration list; the current token must be the base type name:
 *
 *     <type> name [= #N | { body }] {, name ...} ;
 *
 * Each declared value is stored in parser->globals (global == true) or
 * parser->locals. For a function type a TYPE_FUNCTION value and an
 * ast_function are created; the originally parsed value becomes the function
 * value's `expression.next` and its parameters are moved to the function
 * value.
 *
 * Ownership: until a value has been added to globals/locals it is deleted on
 * every error path here. Once it has been added it is left alone, because the
 * vector still references it.
 *
 * Returns true on success, false on any error.
 */
static bool parser_variable(parser_t *parser, bool global)
{
    bool          isfunc = false;
    ast_function *func = NULL;
    lex_ctx       ctx;
    ast_value    *var;
    int           basetype = parser_token(parser)->constval.t;

    while (true)
    {
        if (!parser_next(parser)) { /* skip basetype or comma */
            parseerror(parser, "expected variable declaration");
            return false;
        }

        isfunc = false;
        func = NULL;
        ctx = parser_ctx(parser);
        var = parser_parse_type(parser, basetype, &isfunc);

        if (!var)
            return false;

        if (parser->tok != TOKEN_IDENT) {
            parseerror(parser, "expected variable name\n");
            ast_value_delete(var); /* not stored anywhere yet */
            return false;
        }

        if (global && parser_find_global(parser, parser_tokval(parser))) {
            ast_value_delete(var);
            parseerror(parser, "global already exists: %s\n", parser_tokval(parser));
            return false;
        }

        /* locals may shadow outer ones; only the current block is checked */
        if (!global && parser_find_local(parser, parser_tokval(parser), parser->blocklocal)) {
            ast_value_delete(var);
            parseerror(parser, "local variable already exists: %s\n", parser_tokval(parser));
            return false;
        }

        if (!ast_value_set_name(var, parser_tokval(parser))) {
            parseerror(parser, "failed to set variable name\n");
            ast_value_delete(var);
            return false;
        }

        if (isfunc) {
            /* a function was defined */
            ast_value *fval;

            /* turn var into a value of TYPE_FUNCTION, with the old var
             * as return type
             */
            fval = ast_value_new(ctx, var->name, TYPE_FUNCTION);
            func = ast_function_new(ctx, var->name, fval);
            if (!fval || !func) {
                ast_value_delete(var);
                if (fval) ast_value_delete(fval);
                if (func) ast_function_delete(func);
                return false;
            }

            fval->expression.next = (ast_expression*)var;
            MEM_VECTOR_MOVE(var, params, fval, params);

            if (!parser_t_functions_add(parser, func)) {
                ast_value_delete(var);
                if (fval) ast_value_delete(fval);
                if (func) ast_function_delete(func);
                return false;
            }

            var = fval;
        }

        if ( ( global && !parser_t_globals_add(parser, var)) ||
             (!global && !parser_t_locals_add(parser, var)) )
        {
            ast_value_delete(var);
            return false;
        }

        /* From here on `var` is referenced by globals/locals and must not be
         * deleted on error.
         */
        if (!parser_next(parser))
            return false;

        if (parser->tok == ';') {
            if (!parser_next(parser))
                return parser->tok == TOKEN_EOF;
            return true;
        }

        if (parser->tok == ',') {
            /* another var */
            continue;
        }

        if (parser->tok != '=') {
            parseerror(parser, "expected '=' or ';'");
            return false;
        }

        if (!parser_next(parser))
            return false;

        if (parser->tok == '#') {
            /* builtin: `= #N` */
            if (!global) {
                parseerror(parser, "cannot declare builtins within functions");
                return false;
            }
            if (!isfunc || !func) {
                parseerror(parser, "unexpected builtin number, '%s' is not a function", var->name);
                return false;
            }
            if (!parser_next(parser)) {
                parseerror(parser, "expected builtin number");
                return false;
            }
            if (parser->tok != TOKEN_INTCONST) {
                parseerror(parser, "builtin number must be an integer constant");
                return false;
            }
            if (parser_token(parser)->constval.i <= 0) {
                parseerror(parser, "builtin number must be positive integer greater than zero");
                return false;
            }

            /* stored negated */
            func->builtin = -parser_token(parser)->constval.i;
        } else if (parser->tok == '{') {
            /* function body */
            ast_block *block;
            ast_function *old = parser->function;

            if (!global) {
                parseerror(parser, "cannot declare functions within functions");
                return false;
            }

            parser->function = func;
            block = parser_parse_block(parser);
            parser->function = old;

            if (!block)
                return false;

            if (!ast_function_blocks_add(func, block)) {
                ast_block_delete(block);
                return false;
            }
            return true;
        } else {
            /* NOTE(review): an error is printed but parsing continues and the
             * function may still return true - confirm whether that is intended.
             */
            parseerror(parser, "TODO, const assignment");
        }

        if (!parser_next(parser))
            return false;

        if (parser->tok == ',') {
            /* another */
            continue;
        }

        if (parser->tok != ';') {
            parseerror(parser, "expected semicolon");
            return false;
        }

        (void)parser_next(parser);

        return true;
    }
}
2012-07-20 10:46:59 +00:00
/*
 * Parse one top-level element.
 *
 * Only declarations introduced by a type name are supported. Keywords and
 * entity-member declarations ('.') are not implemented and fail without a
 * message of their own; any other token is reported as unexpected.
 */
static bool parser_do(parser_t *parser)
{
    if (parser->tok == TOKEN_TYPENAME)
        return parser_variable(parser, true);

    if (parser->tok == TOKEN_KEYWORD) {
        /* handle 'var' and 'const' */
        return false;
    }

    if (parser->tok == '.') {
        /* entity-member declaration */
        return false;
    }

    parseerror(parser, "unexpected token: %s", parser->lex->tok->value);
    return false;
}
2012-07-16 11:59:10 +00:00
bool parser_compile(const char *filename)
{
2012-07-16 12:52:52 +00:00
size_t i;
2012-07-16 12:14:37 +00:00
parser_t *parser;
ir_builder *ir;
2012-07-16 12:14:37 +00:00
parser = (parser_t*)mem_a(sizeof(parser_t));
if (!parser)
return false;
memset(parser, 0, sizeof(parser));
2012-07-16 12:52:52 +00:00
MEM_VECTOR_INIT(parser, globals);
MEM_VECTOR_INIT(parser, locals);
2012-07-16 12:14:37 +00:00
parser->lex = lex_open(filename);
if (!parser->lex) {
printf("failed to open file \"%s\"\n", filename);
return false;
}
2012-07-16 12:52:52 +00:00
/* initial lexer/parser state */
parser->lex->flags.noops = true;
if (parser_next(parser))
2012-07-16 12:14:37 +00:00
{
2012-07-16 12:52:52 +00:00
while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
{
if (!parser_do(parser)) {
2012-07-19 09:22:09 +00:00
if (parser->tok == TOKEN_EOF)
2012-07-19 10:17:00 +00:00
parseerror(parser, "unexpected eof");
else
parseerror(parser, "parse error\n");
2012-07-16 12:52:52 +00:00
lex_close(parser->lex);
mem_d(parser);
return false;
}
2012-07-16 12:14:37 +00:00
}
}
lex_close(parser->lex);
ir = ir_builder_new("gmqcc_out");
if (!ir) {
printf("failed to allocate builder\n");
goto cleanup;
}
for (i = 0; i < parser->imm_float_count; ++i) {
if (!ast_global_codegen(parser->imm_float[i], ir)) {
printf("failed to generate global %s\n", parser->imm_float[i]->name);
}
}
for (i = 0; i < parser->globals_count; ++i) {
if (!ast_global_codegen(parser->globals[i], ir)) {
printf("failed to generate global %s\n", parser->globals[i]->name);
}
}
for (i = 0; i < parser->functions_count; ++i) {
if (!ast_function_codegen(parser->functions[i], ir)) {
printf("failed to generate function %s\n", parser->functions[i]->name);
}
if (!ir_function_finalize(parser->functions[i]->ir_func)) {
printf("failed to finalize function %s\n", parser->functions[i]->name);
}
}
ir_builder_dump(ir, printf);
cleanup:
2012-07-16 12:52:52 +00:00
for (i = 0; i < parser->globals_count; ++i) {
ast_value_delete(parser->globals[i]);
}
MEM_VECTOR_CLEAR(parser, globals);
2012-07-16 12:14:37 +00:00
mem_d(parser);
return true;
2012-07-16 11:59:10 +00:00
}