mirror of
https://git.code.sf.net/p/quake/quakeforge
synced 2025-02-26 05:31:50 +00:00
963 lines
24 KiB
Text
963 lines
24 KiB
Text
/*
|
||
qc-lex.l
|
||
|
||
lexer for quakec
|
||
|
||
Copyright (C) 2001 Bill Currie <bill@taniwha.org>
|
||
|
||
Author: Bill Currie <bill@taniwha.org>
|
||
Date: 2001/06/12
|
||
|
||
This program is free software; you can redistribute it and/or
|
||
modify it under the terms of the GNU General Public License
|
||
as published by the Free Software Foundation; either version 2
|
||
of the License, or (at your option) any later version.
|
||
|
||
This program is distributed in the hope that it will be useful,
|
||
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
|
||
|
||
See the GNU General Public License for more details.
|
||
|
||
You should have received a copy of the GNU General Public License
|
||
along with this program; if not, write to:
|
||
|
||
Free Software Foundation, Inc.
|
||
59 Temple Place - Suite 330
|
||
Boston, MA 02111-1307, USA
|
||
|
||
*/
|
||
%option bison-locations
|
||
%option bison-bridge
|
||
%option reentrant
|
||
%option prefix="qc_yy"
|
||
%option noyywrap
|
||
%option debug
|
||
|
||
%top{
|
||
#ifdef HAVE_CONFIG_H
|
||
# include "config.h"
|
||
#endif
|
||
|
||
#ifdef HAVE_STRING_H
|
||
# include <string.h>
|
||
#endif
|
||
#ifdef HAVE_STRINGS_H
|
||
# include <strings.h>
|
||
#endif
|
||
#include <stdlib.h>
|
||
#include <ctype.h>
|
||
|
||
#include <QF/dstring.h>
|
||
#include <QF/hash.h>
|
||
#include <QF/sys.h>
|
||
|
||
#include "tools/qfcc/include/class.h"
|
||
#include "tools/qfcc/include/debug.h"
|
||
#include "tools/qfcc/include/diagnostic.h"
|
||
#include "tools/qfcc/include/expr.h"
|
||
#include "tools/qfcc/include/grab.h"
|
||
#include "tools/qfcc/include/options.h"
|
||
#include "tools/qfcc/include/pragma.h"
|
||
#include "tools/qfcc/include/qfcc.h"
|
||
#include "tools/qfcc/include/rua-lang.h"
|
||
#include "tools/qfcc/include/shared.h"
|
||
#include "tools/qfcc/include/strpool.h"
|
||
#include "tools/qfcc/include/struct.h"
|
||
#include "tools/qfcc/include/symtab.h"
|
||
#include "tools/qfcc/include/type.h"
|
||
#include "tools/qfcc/include/value.h"
|
||
}
|
||
|
||
%{
|
||
#ifndef YY_PROTO
|
||
# define YY_PROTO(x) x
|
||
#else
|
||
# define YY_FLEX_REALLOC_HACK
|
||
#endif
|
||
|
||
#define YY_NO_INPUT // debian flex
|
||
#define YY_NO_UNPUT // debian flex
|
||
#define YY_NO_YYINPUT
|
||
#define YY_NO_YYUNPUT
|
||
|
||
#define YYSTYPE rua_tok_t
|
||
#define YYLTYPE rua_loc_t
|
||
|
||
typedef struct rua_extra_s {
|
||
int start_state;
|
||
} rua_extra_t;
|
||
#define YY_EXTRA_TYPE rua_extra_t *
|
||
|
||
rua_extra_t *qc_yyget_extra (yyscan_t yyscanner) __attribute__((pure));
|
||
int yyget_lineno (yyscan_t yyscanner) __attribute__((pure));
|
||
int yyget_column (yyscan_t yyscanner) __attribute__((pure));
|
||
YYSTYPE *yyget_lval (yyscan_t yyscanner) __attribute__((pure));
|
||
YYLTYPE *yyget_lloc (yyscan_t yyscanner) __attribute__((pure));
|
||
int yyget_leng (yyscan_t yyscanner) __attribute__((pure));
|
||
char *yyget_text (yyscan_t yyscanner) __attribute__((pure));
|
||
int yyget_debug (yyscan_t yyscanner) __attribute__((pure));
|
||
FILE *yyget_in (yyscan_t yyscanner) __attribute__((pure));
|
||
FILE *yyget_out (yyscan_t yyscanner) __attribute__((pure));
|
||
|
||
static int keyword_or_id (YYSTYPE *lval, const char *token);
|
||
static void user_action (rua_tok_t *tok, rua_loc_t *loc,
|
||
const char *text, size_t textlen);
|
||
|
||
enum {
|
||
rua_eof = 1,
|
||
rua_error,
|
||
rua_number,
|
||
rua_vector,
|
||
rua_string,
|
||
rua_char,
|
||
};
|
||
|
||
#define YY_USER_ACTION user_action (yylval, yylloc, yytext, yyleng);
|
||
|
||
%}
|
||
|
||
s [ \t]
|
||
m [\-+]
|
||
D [0-9]
|
||
IDs [a-zA-Z_]
|
||
IDc [a-zA-Z_0-9]
|
||
ID {IDs}{IDc}*
|
||
FD [fFdD]
|
||
UL ([uU]?([lL][lL]?)?)
|
||
ULFD ({UL}|{FD})
|
||
RANGE \.\.
|
||
ELLIPSIS \.\.\.
|
||
FRAMEID {ID}(\.{ID})*
|
||
PRAGMAID {ID}(-{ID})*
|
||
s_string \"(\\.|[^"\\])*\"
|
||
c_string '(\\.|[^'\\])*'
|
||
|
||
pp_number \.?{D}({IDc}|'{IDc}|[eEpP]{m}|\.)*
|
||
|
||
%x GRAB_FRAME GRAB_OTHER GRAB_WRITE COMMENT LCOMMENT PRAGMA
|
||
%x VECTOR
|
||
|
||
%%
|
||
auto extra = qc_yyget_extra (yyscanner);
|
||
BEGIN (extra->start_state);
|
||
yyset_debug (0, yyscanner);
|
||
grab_frame = GRAB_FRAME;
|
||
grab_other = GRAB_OTHER;
|
||
grab_write = GRAB_WRITE;
|
||
yylval->pointer = 0; // ensure pointer vals are null
|
||
|
||
"/*" { BEGIN (COMMENT); }
|
||
<COMMENT>"/*" { warning (0, "nested /* in comment"); }
|
||
<COMMENT>"*/" { BEGIN (INITIAL); }
|
||
<COMMENT>\r*\n { pr.source_line++; }
|
||
<COMMENT>. /* nothing to do */
|
||
<COMMENT><<EOF>> { error (0, "EOF in comment"); return 0; }
|
||
"//" { BEGIN (LCOMMENT); } /* exited by <*>\r\n rule */
|
||
<LCOMMENT>[^\\\r\n]* /* consume all but \ and EOL (see line continuation) */
|
||
<LCOMMENT>[\\]* /* consume \ */
|
||
|
||
^#{s}+{D}+{s}+\"(\.|[^"\n])*\".*$ { line_info (yytext + 1); }
|
||
^#line{s}+{D}+{s}+\"(\.|[^"\n])*\".*$ { line_info (yytext + 5); }
|
||
|
||
^{s}*#{s}*pragma{s}+ { BEGIN (PRAGMA); }
|
||
|
||
{ID} {
|
||
int tok = keyword_or_id(yylval, yytext);
|
||
return tok;
|
||
}
|
||
@{ID} {
|
||
int tok = keyword_or_id(yylval, yytext);
|
||
if (tok == '@')
|
||
REJECT;
|
||
return tok;
|
||
}
|
||
|
||
@ return '@';
|
||
|
||
{pp_number} { return -rua_number; }
|
||
'({s}*{m}?{pp_number}){2,4}{s}*'{ULFD}? { return -rua_vector; }
|
||
<VECTOR>{pp_number} { return -rua_number; }
|
||
<VECTOR>{m} { return yytext[0]; }
|
||
<VECTOR>' { return -rua_eof; }
|
||
|
||
{s_string} { return -rua_string; };
|
||
{c_string} { return -rua_char; }
|
||
[+\-*/&|^%]= {
|
||
yylval->value.op = yytext[0];
|
||
return ASX;
|
||
}
|
||
|
||
"%%=" {
|
||
yylval->value.op = MOD;
|
||
return ASX;
|
||
}
|
||
|
||
"<<=" {
|
||
yylval->value.op = SHL;
|
||
return ASX;
|
||
}
|
||
|
||
">>=" {
|
||
yylval->value.op = SHR;
|
||
return ASX;
|
||
}
|
||
|
||
[!(){}.*/&|^~+\-=\[\];,#%?:] {
|
||
return yytext[0];
|
||
}
|
||
|
||
"·" { return DOT; }
|
||
"â‹€" { return WEDGE; }
|
||
"•" { return DOT; }
|
||
"∧" { return WEDGE; }
|
||
"∨" { return REGRESSIVE; }
|
||
"†" { return REVERSE; }
|
||
"∗" { return STAR; }
|
||
"×" { return CROSS; }
|
||
"⋆" { return DUAL; }
|
||
|
||
"%%" {
|
||
return MOD;
|
||
}
|
||
|
||
{ELLIPSIS} return ELLIPSIS;
|
||
|
||
"<<" return SHL;
|
||
">>" return SHR;
|
||
|
||
"&&" return AND;
|
||
"||" return OR;
|
||
"==" return EQ;
|
||
"!=" return NE;
|
||
"<=" return LE;
|
||
">=" return GE;
|
||
"<" return LT;
|
||
">" return GT;
|
||
|
||
"++" {
|
||
yylval->value.op = '+';
|
||
return INCOP;
|
||
}
|
||
|
||
"--" {
|
||
yylval->value.op = '-';
|
||
return INCOP;
|
||
}
|
||
|
||
"$"{s}*{FRAMEID} {
|
||
int ret = do_grab (yytext);
|
||
if (ret >= 0) {
|
||
yylval->value.expr = new_int_expr (ret, false);
|
||
return VALUE;
|
||
} else {
|
||
BEGIN (-ret);
|
||
}
|
||
}
|
||
|
||
<GRAB_FRAME>{FRAMEID} add_frame_macro (yytext);
|
||
<GRAB_OTHER>[^\r\n]* /* skip */
|
||
<GRAB_WRITE>{s_string} {
|
||
const char *s = make_string (yytext, 0);
|
||
write_frame_macros (s);
|
||
BEGIN (GRAB_OTHER); // ignore rest of line
|
||
}
|
||
<PRAGMA>{PRAGMAID} { pragma_add_arg (yytext); }
|
||
<PRAGMA>@{PRAGMAID} { pragma_add_arg (yytext); }
|
||
|
||
<*>\\\r*\n { pr.source_line++; } /* line continuation */
|
||
<*>\r*\n {
|
||
if (YY_START == PRAGMA) {
|
||
pragma_process ();
|
||
}
|
||
pr.source_line++;
|
||
BEGIN (INITIAL);
|
||
}
|
||
|
||
<*>{s}* /* skip */
|
||
|
||
<*>. error (0, "all your typo are belong to us");
|
||
|
||
%%
|
||
|
||
typedef struct {
|
||
const char *name;
|
||
int value;
|
||
specifier_t spec;
|
||
} keyword_t;
|
||
|
||
// These keywords are part of the Ruamoko language and require the QuakeForge
|
||
// Ruamoko VM.
|
||
static keyword_t rua_keywords[] = {
|
||
#define VEC_TYPE(type_name, base_type) \
|
||
{ #type_name, TYPE_SPEC, .spec = { .type = &type_##type_name } },
|
||
#include "tools/qfcc/include/vec_types.h"
|
||
};
|
||
|
||
// These keywords are all part of the Ruamoko (Objective-QC) language.
|
||
// The first time any one of them is encountered, the class system will be
|
||
// initialized.
|
||
// If not compiling for the QuakeForge VM, or if Ruamoko has been disabled,
|
||
// then they will be unavailable as keywords.
|
||
static keyword_t obj_keywords[] = {
|
||
{"id", OBJECT_NAME, .spec = { .type = &type_id } },
|
||
{"Class", TYPE_SPEC, .spec = { .type = &type_Class } },
|
||
{"Method", TYPE_SPEC, .spec = { .type = &type_method } },
|
||
{"Super", TYPE_SPEC, .spec = { .type = &type_super } },
|
||
{"SEL", TYPE_SPEC, .spec = { .type = &type_SEL } },
|
||
{"IMP", TYPE_SPEC, .spec = { .type = &type_IMP } },
|
||
|
||
{"@class", CLASS },
|
||
{"@defs", DEFS },
|
||
{"@encode", ENCODE },
|
||
{"@end", END },
|
||
{"@implementation", IMPLEMENTATION },
|
||
{"@interface", INTERFACE },
|
||
{"@private", PRIVATE },
|
||
{"@protected", PROTECTED },
|
||
{"@protocol", PROTOCOL },
|
||
{"@public", PUBLIC },
|
||
{"@reference", REFERENCE },
|
||
{"@selector", SELECTOR },
|
||
{"@self", SELF },
|
||
{"@this", THIS },
|
||
|
||
// This is a hack to trigger the initialization of the class
|
||
// sytem if it is seen before any other Objective-QC symbol. Otherwise,
|
||
// it is just an identifier, though it does reference a built-in type
|
||
// created by the class system.
|
||
{"obj_module", 0 },
|
||
};
|
||
|
||
// These keywords are extensions to QC and thus available only in advanced
|
||
// or extended code. However, if they are preceeded by an @ (eg, @for), then
|
||
// they are always available. This is to prevent them from causing trouble
|
||
// for traditional code that might use these words as identifiers, but still
|
||
// make the language features available to traditional code.
|
||
static keyword_t at_keywords[] = {
|
||
{"for", FOR },
|
||
{"goto", GOTO },
|
||
{"break", BREAK },
|
||
{"continue", CONTINUE},
|
||
{"switch", SWITCH },
|
||
{"case", CASE },
|
||
{"default", DEFAULT },
|
||
{"nil", NIL },
|
||
{"struct", STRUCT },
|
||
{"union", STRUCT },
|
||
{"enum", ENUM },
|
||
{"typedef", TYPEDEF },
|
||
{"extern", EXTERN },
|
||
{"static", STATIC },
|
||
{"sizeof", SIZEOF },
|
||
{"not", NOT },
|
||
{"auto", TYPE_SPEC, .spec = { .type = &type_auto } },
|
||
};
|
||
|
||
// These keywords require the QuakeForge VM to be of any use. ie, they cannot
|
||
// be supported (sanely) by v6 progs.
|
||
static keyword_t qf_keywords[] = {
|
||
{"quaternion", TYPE_SPEC, .spec = { .type = &type_quaternion } },
|
||
{"double", TYPE_SPEC, .spec = { .type = &type_double } },
|
||
{"int", TYPE_SPEC, .spec = { .type = &type_int } },
|
||
{"unsigned", TYPE_SPEC, .spec = { .is_unsigned = 1 } },
|
||
{"signed", TYPE_SPEC, .spec = { .is_signed = 1 } },
|
||
{"long", TYPE_SPEC, .spec = { .is_long = 1 } },
|
||
{"short", TYPE_SPEC, .spec = { .is_short = 1 } },
|
||
|
||
{"@function", TYPE_SPEC, .spec = { .type = &type_func } },
|
||
{"@args", ARGS, },
|
||
{"@va_list", TYPE_SPEC, .spec = { .type = &type_va_list } },
|
||
{"@param", TYPE_SPEC, .spec = { .type = &type_param } },
|
||
{"@return", AT_RETURN, },
|
||
|
||
{"@hadamard", HADAMARD, },
|
||
{"@cross", CROSS, },
|
||
{"@dot", DOT, },
|
||
{"@wedge", WEDGE, },
|
||
{"@regressive", REGRESSIVE, },
|
||
{"@geometric", GEOMETRIC, },
|
||
{"@algebra", ALGEBRA, },
|
||
};
|
||
|
||
// These keywors are always available. Other than the @ keywords, they
|
||
// form traditional QuakeC.
|
||
static keyword_t keywords[] = {
|
||
{"void", TYPE_SPEC, .spec = { .type = &type_void } },
|
||
{"float", TYPE_SPEC, .spec = { .type = &type_float } },
|
||
{"string", TYPE_SPEC, .spec = { .type = &type_string } },
|
||
{"vector", TYPE_SPEC, .spec = { .type = &type_vector } },
|
||
{"entity", TYPE_SPEC, .spec = { .type = &type_entity } },
|
||
{"local", LOCAL, },
|
||
{"return", RETURN, },
|
||
{"while", WHILE, },
|
||
{"do", DO, },
|
||
{"if", IF, },
|
||
{"else", ELSE, },
|
||
{"@system", SYSTEM, },
|
||
{"@overload", OVERLOAD, },
|
||
{"@attribute", ATTRIBUTE, },
|
||
{"@handle", HANDLE, },
|
||
};
|
||
|
||
static const char *
|
||
keyword_get_key (const void *kw, void *unused)
|
||
{
|
||
return ((keyword_t*)kw)->name;
|
||
}
|
||
|
||
static int
|
||
process_keyword (YYSTYPE *lval, keyword_t *keyword, const char *token)
|
||
{
|
||
if (keyword->value == STRUCT) {
|
||
lval->value.op = token[0];
|
||
} else if (keyword->value == OBJECT_NAME) {
|
||
symbol_t *sym;
|
||
|
||
sym = symtab_lookup (current_symtab, token);
|
||
lval->value.symbol = sym;
|
||
// the global id symbol is always just a name so attempts to redefine
|
||
// it globally can be caught and treated as an error, but it needs to
|
||
// be redefinable when in an enclosing scope.
|
||
if (sym->sy_type == sy_name) {
|
||
// this is the global id (object)
|
||
lval->value.spec = (specifier_t) {
|
||
.type = sym->type,
|
||
.sym = sym,
|
||
};
|
||
return OBJECT_NAME;
|
||
} else if (sym->sy_type == sy_type) {
|
||
// id has been redeclared via a typedef
|
||
lval->value.spec = (specifier_t) {
|
||
.type = sym->type,
|
||
.sym = sym,
|
||
};
|
||
return TYPE_NAME;
|
||
}
|
||
// id has been redelcared as a variable (hopefully)
|
||
return NAME;
|
||
} else {
|
||
lval->value.spec = keyword->spec;
|
||
}
|
||
return keyword->value;
|
||
}
|
||
|
||
static int
|
||
keyword_or_id (YYSTYPE *lval, const char *token)
|
||
{
|
||
static hashtab_t *keyword_tab;
|
||
static hashtab_t *qf_keyword_tab;
|
||
static hashtab_t *at_keyword_tab;
|
||
static hashtab_t *obj_keyword_tab;
|
||
static hashtab_t *rua_keyword_tab;
|
||
|
||
keyword_t *keyword = 0;
|
||
symbol_t *sym;
|
||
|
||
if (!keyword_tab) {
|
||
size_t i;
|
||
|
||
keyword_tab = Hash_NewTable (253, keyword_get_key, 0, 0, 0);
|
||
qf_keyword_tab = Hash_NewTable (253, keyword_get_key, 0, 0, 0);
|
||
at_keyword_tab = Hash_NewTable (253, keyword_get_key, 0, 0, 0);
|
||
obj_keyword_tab = Hash_NewTable (253, keyword_get_key, 0, 0, 0);
|
||
rua_keyword_tab = Hash_NewTable (253, keyword_get_key, 0, 0, 0);
|
||
|
||
#define NUMKEYS(_k) (sizeof (_k) / sizeof (_k[0]))
|
||
|
||
for (i = 0; i < NUMKEYS(keywords); i++)
|
||
Hash_Add (keyword_tab, &keywords[i]);
|
||
for (i = 0; i < NUMKEYS(qf_keywords); i++)
|
||
Hash_Add (qf_keyword_tab, &qf_keywords[i]);
|
||
for (i = 0; i < NUMKEYS(at_keywords); i++)
|
||
Hash_Add (at_keyword_tab, &at_keywords[i]);
|
||
for (i = 0; i < NUMKEYS(obj_keywords); i++)
|
||
Hash_Add (obj_keyword_tab, &obj_keywords[i]);
|
||
for (i = 0; i < NUMKEYS(rua_keywords); i++)
|
||
Hash_Add (rua_keyword_tab, &rua_keywords[i]);
|
||
}
|
||
if (options.traditional < 1) {
|
||
if (options.code.progsversion == PROG_VERSION) {
|
||
keyword = Hash_Find (rua_keyword_tab, token);
|
||
}
|
||
if (!keyword) {
|
||
keyword = Hash_Find (obj_keyword_tab, token);
|
||
if (keyword) {
|
||
if (!obj_initialized)
|
||
class_init ();
|
||
}
|
||
}
|
||
if (!keyword)
|
||
keyword = Hash_Find (qf_keyword_tab, token);
|
||
}
|
||
if (!keyword && options.traditional < 2)
|
||
keyword = Hash_Find (at_keyword_tab, token);
|
||
if (!keyword && token[0] == '@') {
|
||
keyword = Hash_Find (at_keyword_tab, token + 1);
|
||
if (keyword)
|
||
token += 1;
|
||
}
|
||
if (!keyword)
|
||
keyword = Hash_Find (keyword_tab, token);
|
||
if (keyword && keyword->value)
|
||
return process_keyword (lval, keyword, token);
|
||
if (token[0] == '@') {
|
||
return '@';
|
||
}
|
||
sym = symtab_lookup (current_symtab, token);
|
||
if (!sym)
|
||
sym = new_symbol (token);
|
||
lval->value.symbol = sym;
|
||
if (sym->sy_type == sy_type) {
|
||
lval->value.spec = (specifier_t) {
|
||
.type = sym->type,
|
||
.sym = sym,
|
||
};
|
||
return TYPE_NAME;
|
||
}
|
||
if (sym->sy_type == sy_class)
|
||
return CLASS_NAME;
|
||
return NAME;
|
||
}
|
||
|
||
enum {
|
||
suff_error = -1,
|
||
suff_implicit,
|
||
suff_unsigned,
|
||
suff_long,
|
||
suff_unsigned_long,
|
||
suff_float,
|
||
suff_double,
|
||
suff_long_double,
|
||
};
|
||
|
||
static int
|
||
parse_suffix (const char *suffix, bool fp)
|
||
{
|
||
int expl = suff_implicit;
|
||
bool unsign = false;
|
||
|
||
if (!*suffix) {
|
||
return 0;
|
||
}
|
||
if (fp) {
|
||
if (*suffix == 'f' || *suffix == 'F') {
|
||
expl = suff_float;
|
||
suffix++;
|
||
} else if (*suffix == 'd' || *suffix == 'D') {
|
||
// treat as explicit double unless it's a proper C decimal
|
||
// suffix, in which case the decimal part will be ignored
|
||
// (non-standard, but no decimal supprt)
|
||
expl = suff_double;
|
||
suffix++;
|
||
if (*suffix == 'f' || *suffix == 'F'
|
||
|| *suffix == 'd' || *suffix == 'D'
|
||
|| *suffix == 'l' || *suffix == 'L') {
|
||
warning (0, "decimal fp treated as binary fp");
|
||
expl = suff_double;
|
||
suffix++;
|
||
}
|
||
} else if (*suffix == 'l' || *suffix == 'L') {
|
||
expl = suff_long_double;
|
||
suffix++;
|
||
}
|
||
} else {
|
||
if (*suffix == 'f' || *suffix == 'F') {
|
||
expl = suff_float;
|
||
suffix++;
|
||
} else if (*suffix == 'd' || *suffix == 'D') {
|
||
expl = suff_double;
|
||
suffix++;
|
||
} else {
|
||
if (*suffix == 'u' || *suffix == 'U') {
|
||
unsign = true;
|
||
expl = suff_unsigned;
|
||
suffix++;
|
||
}
|
||
if (*suffix == 'l' || *suffix == 'L') {
|
||
expl = unsign ? suff_unsigned_long : suff_long;
|
||
suffix++;
|
||
if (*suffix == 'l' || *suffix == 'L') {
|
||
suffix++;
|
||
}
|
||
if (!unsign && (*suffix == 'u' || *suffix == 'U')) {
|
||
expl = suff_unsigned_long;
|
||
suffix++;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
if (*suffix) {
|
||
return suff_error;
|
||
}
|
||
|
||
return expl;
|
||
}
|
||
|
||
static int
|
||
parse_number (rua_tok_t *tok, yyscan_t scanner)
|
||
{
|
||
bool binary = false;
|
||
const char *type = "integer";
|
||
bool hex = false;
|
||
bool fp = false;
|
||
char buf[tok->textlen + 1], *dst = buf;
|
||
const char *src = tok->text;
|
||
if ((*dst = *src++) == '0') {
|
||
switch ((*++dst = *src++)) {
|
||
case 'b': case 'B':
|
||
binary = true;
|
||
type = "binary";
|
||
break;
|
||
case 'x': case 'X':
|
||
hex = true;
|
||
type = "hexadecimal";
|
||
break;
|
||
case '.':
|
||
fp = true;
|
||
break;
|
||
case '1' ... '9':
|
||
type = "octal"; // unless fp becomes true
|
||
break;
|
||
case '\'': case '_':
|
||
if (*src == 'b' || *src == 'B' || *src == 'x' || *src == 'X') {
|
||
error (0, "digit separator outside digit sequence");
|
||
return -rua_error;
|
||
}
|
||
break;
|
||
}
|
||
}
|
||
if (*dst) {
|
||
dst += (*dst != '\'' && *dst != '_');
|
||
while ((*dst = *src++)) {
|
||
if (hex && (*dst == 'p' || *dst == 'P')) {
|
||
fp = true;
|
||
}
|
||
if (!hex && (*dst == 'e' || *dst == 'E')) {
|
||
fp = true;
|
||
}
|
||
if (*dst == '.') {
|
||
fp = true;
|
||
}
|
||
// strip out digit separators (' is standard C, _ is a rust
|
||
// thing, but it does look a bit nicerer than ', so why not).
|
||
dst += (*dst != '\'' && *dst != '_');
|
||
}
|
||
}
|
||
// use long long to avoid bit-size issues on windows
|
||
long long lvalue = 0;
|
||
double fvalue = 0;
|
||
char *endptr = 0;
|
||
if (binary) {
|
||
// to get here, 0b (or 0B) was seen, so buf is guaranted to start with
|
||
// that
|
||
lvalue = strtoll (buf + 2, &endptr, 2);
|
||
} else {
|
||
if (fp) {
|
||
fvalue = strtod (buf, &endptr);
|
||
} else {
|
||
lvalue = strtoll (buf, &endptr, 0);
|
||
}
|
||
}
|
||
|
||
int expl = parse_suffix (endptr, fp);
|
||
if (expl < 0) {
|
||
error (0, "invalid suffix \"%s\" on %s constant", endptr,
|
||
fp ? "floating" : type);
|
||
return -rua_error;
|
||
}
|
||
|
||
if (fp) {
|
||
if (expl == suff_float) {
|
||
tok->value.expr = new_float_expr (fvalue);
|
||
} else {
|
||
if (expl == suff_long_double) {
|
||
warning (0, "long double treated as double");
|
||
expl = suff_double;
|
||
}
|
||
tok->value.expr = new_double_expr (fvalue, expl == suff_implicit);
|
||
}
|
||
} else {
|
||
if (expl == suff_unsigned) {
|
||
tok->value.expr = new_uint_expr (lvalue);
|
||
} else if (expl == suff_long || expl == suff_implicit) {
|
||
tok->value.expr = new_long_expr (lvalue, expl == suff_implicit);
|
||
} else if (expl == suff_unsigned_long) {
|
||
tok->value.expr = new_ulong_expr (lvalue);
|
||
} else if (expl == suff_float) {
|
||
tok->value.expr = new_float_expr (lvalue);
|
||
} else if (expl == suff_double) {
|
||
tok->value.expr = new_double_expr (lvalue, false);
|
||
} else {
|
||
internal_error (0, "invalid suffix enum: %d", expl);
|
||
}
|
||
}
|
||
return VALUE;
|
||
}
|
||
|
||
typedef struct {
|
||
yyscan_t scanner;
|
||
yybuffer buffer;
|
||
} buffer_raii_t;
|
||
|
||
static void
|
||
qc_restore_buffer (buffer_raii_t *raii)
|
||
{
|
||
yy_switch_to_buffer (raii->buffer, raii->scanner);
|
||
}
|
||
|
||
static void
|
||
qc_delete_buffer (buffer_raii_t *raii)
|
||
{
|
||
yy_delete_buffer (raii->buffer, raii->scanner);
|
||
}
|
||
|
||
static int
|
||
parse_vector (rua_tok_t *tok, yyscan_t scanner)
|
||
{
|
||
const char *end = tok->text + tok->textlen;
|
||
while (end > tok->text && *--end != '\'') continue;
|
||
|
||
const char *start = tok->text + 1;
|
||
auto yyg = (struct yyguts_t *)scanner;
|
||
auto __attribute__((cleanup (qc_restore_buffer)))
|
||
saved_buffer = (buffer_raii_t) {
|
||
.scanner = scanner,
|
||
.buffer = YY_CURRENT_BUFFER,
|
||
};
|
||
auto __attribute__((cleanup (qc_delete_buffer)))
|
||
buffer = (buffer_raii_t) {
|
||
.scanner = scanner,
|
||
.buffer = yy_scan_bytes (start, end - start, scanner),
|
||
};
|
||
|
||
int token;
|
||
rua_tok_t vtok = { .location = tok->location, };
|
||
vtok.location.first_column++;
|
||
const expr_t *components[4+1] = {}; // currently, max of 4
|
||
bool negate[4] = {};
|
||
int width = 0;
|
||
|
||
auto extra = qc_yyget_extra (scanner);
|
||
extra->start_state = VECTOR;
|
||
do {
|
||
token = yylex (&vtok, &vtok.location, scanner);
|
||
if (-token == rua_number) {
|
||
token = parse_number (&vtok, scanner);
|
||
}
|
||
if (token == VALUE) {
|
||
if (width < 4) {
|
||
components[width] = vtok.value.expr;
|
||
}
|
||
width++;
|
||
} else if (token == '-') {
|
||
if (width < 4) {
|
||
negate[width] = true;
|
||
}
|
||
}
|
||
} while (token && token != -rua_eof);
|
||
extra->start_state = INITIAL;
|
||
|
||
if (width > 4) {
|
||
error (0, "too many components in vector literal");
|
||
width = 4;
|
||
return -rua_error;
|
||
}
|
||
bool fp = false;
|
||
for (int i = 0; i < width; i++) {
|
||
if (!components[i]->implicit) {
|
||
error (0, "explict numeric constant in vector literal."
|
||
" Suggest suffix after closing '.");
|
||
return -rua_error;
|
||
}
|
||
fp |= is_double (get_type (components[i]));
|
||
}
|
||
|
||
// end points at the final ' and thus any suffix is after that
|
||
int expl = parse_suffix (++end, fp);
|
||
if (expl < 0) {
|
||
error (0, "invalid suffix \"%s\" on %s vector constant", end,
|
||
fp ? "floating" : "integer");
|
||
return -rua_error;
|
||
}
|
||
union {
|
||
pr_float_t f[4];
|
||
pr_int_t i[4];
|
||
pr_double_t d[4];
|
||
pr_long_t l[4];
|
||
pr_type_t t[PR_SIZEOF (lvec4)];
|
||
} data;
|
||
type_t *type = 0;
|
||
if (expl == suff_long_double) {
|
||
warning (0, "long double treated as double");
|
||
expl = suff_double;
|
||
}
|
||
if (expl == suff_float) {
|
||
for (int i = 0; i < width; i++) {
|
||
auto c = components[i];
|
||
if (is_double (get_type (c))) {
|
||
data.f[i] = expr_double (c);
|
||
} else {
|
||
data.f[i] = expr_long (c);
|
||
}
|
||
if (negate[i]) {
|
||
data.f[i] = -data.f[i];
|
||
}
|
||
}
|
||
type = &type_float;
|
||
} else if (expl == suff_double) {
|
||
for (int i = 0; i < width; i++) {
|
||
auto c = components[i];
|
||
if (is_double (get_type (c))) {
|
||
data.d[i] = expr_double (c);
|
||
} else {
|
||
data.d[i] = expr_long (c);
|
||
}
|
||
if (negate[i]) {
|
||
data.d[i] = -data.d[i];
|
||
}
|
||
}
|
||
type = &type_double;
|
||
} else if (expl == suff_implicit) {
|
||
if (fp) {
|
||
for (int i = 0; i < width; i++) {
|
||
auto c = components[i];
|
||
if (is_double (get_type (c))) {
|
||
data.f[i] = expr_double (c);
|
||
} else {
|
||
data.f[i] = expr_long (c);
|
||
}
|
||
if (negate[i]) {
|
||
data.f[i] = -data.f[i];
|
||
}
|
||
}
|
||
type = &type_float;
|
||
} else {
|
||
for (int i = 0; i < width; i++) {
|
||
auto c = components[i];
|
||
data.i[i] = expr_long (c);
|
||
if (negate[i]) {
|
||
data.i[i] = -data.i[i];
|
||
}
|
||
}
|
||
type = &type_int;
|
||
}
|
||
} else if (expl == suff_unsigned) {
|
||
for (int i = 0; i < width; i++) {
|
||
auto c = components[i];
|
||
data.i[i] = fp ? expr_double (c) : expr_long (c);
|
||
if (negate[i]) {
|
||
data.i[i] = -data.i[i];
|
||
}
|
||
}
|
||
type = &type_uint;
|
||
} else if (expl == suff_long || expl == suff_unsigned_long) {
|
||
for (int i = 0; i < width; i++) {
|
||
auto c = components[i];
|
||
data.l[i] = expr_long (c);
|
||
if (negate[i]) {
|
||
data.l[i] = -data.l[i];
|
||
}
|
||
}
|
||
type = expl == suff_unsigned_long ? &type_ulong : &type_long;
|
||
}
|
||
type = vector_type (type, width);
|
||
tok->value.expr = new_value_expr (new_type_value (type, data.t),
|
||
expl == suff_implicit);
|
||
|
||
return VALUE;
|
||
}
|
||
|
||
static int
|
||
parse_string (rua_tok_t *tok, int type, yyscan_t scanner)
|
||
{
|
||
const char *str = make_string (tok->text, 0);
|
||
if (type == rua_char) {
|
||
if (str[1]) {
|
||
warning (0, "multibyte char constant");
|
||
}
|
||
tok->value.expr = new_int_expr (*str, false);
|
||
return VALUE;
|
||
} else {
|
||
tok->value.expr = new_string_expr (str);
|
||
return STRING;
|
||
}
|
||
}
|
||
|
||
static void
|
||
user_action (rua_tok_t *tok, rua_loc_t *loc, const char *text, size_t textlen)
|
||
{
|
||
if (textlen < sizeof (tok->text)) {
|
||
strncpy (tok->str_text, text, textlen);
|
||
tok->str_text[textlen] = 0;
|
||
tok->text = tok->str_text;
|
||
} else {
|
||
tok->text = save_string (text);
|
||
}
|
||
tok->textlen = textlen;
|
||
loc->first_line = loc->last_line;
|
||
loc->first_column = loc->last_column;
|
||
for(int i = 0; text[i] != '\0'; i++) {
|
||
if(text[i] == '\n') {
|
||
loc->last_line++;
|
||
loc->last_column = 1;
|
||
} else {
|
||
loc->last_column++;
|
||
}
|
||
}
|
||
}
|
||
|
||
static int
|
||
qc_process (qc_yypstate *ps, int token, rua_tok_t *tok, yyscan_t scanner)
|
||
{
|
||
auto value = &tok->value;
|
||
auto loc = &tok->location;
|
||
|
||
switch (-token) {
|
||
case rua_number:
|
||
token = parse_number (tok, scanner);
|
||
if (token == VALUE && value->expr->implicit) {
|
||
if (is_long (get_type (value->expr))) {
|
||
pr_long_t v = expr_long (value->expr);
|
||
if (v < INT32_MIN || v > INT32_MAX) {
|
||
warning (0, "integer value truncated");
|
||
}
|
||
value->expr = new_int_expr (v, true);
|
||
}
|
||
}
|
||
break;
|
||
case rua_vector:
|
||
token = parse_vector (tok, scanner);
|
||
break;
|
||
case rua_string:
|
||
case rua_char:
|
||
token = parse_string (tok, -token, scanner);
|
||
break;
|
||
}
|
||
if (token >= 0) {
|
||
return qc_yypush_parse (ps, token, value, loc, scanner);
|
||
}
|
||
return YYPUSH_MORE;
|
||
}
|
||
|
||
int
|
||
qc_yyparse (FILE *in)
|
||
{
|
||
int status;
|
||
yyscan_t scanner;
|
||
qc_yypstate *ps = qc_yypstate_new ();
|
||
rua_tok_t tok = { .location = { 1, 1, 1, 1, pr.source_file }, };
|
||
rua_extra_t extra = {};
|
||
|
||
yylex_init_extra (&extra, &scanner);
|
||
yyset_in (in, scanner);
|
||
do {
|
||
int token = yylex (&tok, &tok.location, scanner);
|
||
status = qc_process (ps, token, &tok, scanner);
|
||
} while (status == YYPUSH_MORE);
|
||
|
||
yylex_destroy (scanner);
|
||
qc_yypstate_delete (ps);
|
||
return status;
|
||
}
|