/* * File Tokeniser/Parser/Whatever * by Jonathon Fowler * Remixed completely by Ken Silverman * See the included license file "BUILDLIC.TXT" for license info. */ #include "compat.h" #include "scriptfile.h" #include "baselayer.h" #include "compat.h" #include "common.h" #include "filesystem.h" #define ISWS(x) ((x == ' ') || (x == '\t') || (x == '\r') || (x == '\n')) static inline void skipoverws(scriptfile *sf) { if ((sf->textptr < sf->eof) && (!sf->textptr[0])) sf->textptr++; } static inline void skipovertoken(scriptfile *sf) { while ((sf->textptr < sf->eof) && (sf->textptr[0])) sf->textptr++; } char *scriptfile_gettoken(scriptfile *sf) { if (scriptfile_eof(sf)) return NULL; char *start = sf->ltextptr = sf->textptr; skipovertoken(sf); return start; } static int scriptfile_eof_error(scriptfile *sf) { if (scriptfile_eof(sf)) { Printf("Error on line %s:%d: unexpected eof\n", sf->filename, scriptfile_getlinum(sf, sf->textptr)); return -1; } return 0; } int32_t scriptfile_getstring(scriptfile *sf, char **retst) { (*retst) = scriptfile_gettoken(sf); if (*retst == NULL) { Printf("Error on line %s:%d: unexpected eof\n",sf->filename,scriptfile_getlinum(sf,sf->textptr)); return -2; } return 0; } int32_t scriptfile_getnumber(scriptfile *sf, int32_t *num) { if (scriptfile_eof_error(sf)) return -1; while ((sf->textptr[0] == '0') && isdigit(sf->textptr[1])) sf->textptr++; //hack to treat octal numbers like decimal sf->ltextptr = sf->textptr; (*num) = strtol((const char *)sf->textptr,&sf->textptr,0); if (!ISWS(*sf->textptr) && *sf->textptr) { char *p = sf->textptr; skipovertoken(sf); Printf("Error on line %s:%d: expecting int32_t, got \"%s\"\n",sf->filename,scriptfile_getlinum(sf,sf->ltextptr),p); return -2; } return 0; } static double parsedouble(char *ptr, char **end) { int32_t beforedecimal = 1, negative = 0, dig; int32_t exposgn = 0, expo = 0; double num = 0.0, decpl = 0.1; char *p; p = ptr; if (*p == '-') negative = 1, p++; else if (*p == '+') p++; for (;; p++) { if (isdigit(*p)) { dig = *p - '0'; if (beforedecimal) num = num * 10.0 + dig; else if (exposgn) expo = expo*10 + dig; else { num += (double)dig * decpl; decpl /= 10.0; } } else if (*p == '.') { if (beforedecimal) beforedecimal = 0; else break; } else if ((*p == 'E') || (*p == 'e')) { exposgn = 1; if (p[1] == '-') { exposgn = -1; p++; } else if (p[1] == '+') p++; } else break; } if (end) *end = p; if (exposgn) num *= pow(10.0,(double)(expo*exposgn)); return negative ? -num : num; } int32_t scriptfile_getdouble(scriptfile *sf, double *num) { if (scriptfile_eof_error(sf)) return -1; sf->ltextptr = sf->textptr; // On Linux, locale settings interfere with interpreting x.y format numbers //(*num) = strtod((const char *)sf->textptr,&sf->textptr); (*num) = parsedouble(sf->textptr, &sf->textptr); if (!ISWS(*sf->textptr) && *sf->textptr) { char *p = sf->textptr; skipovertoken(sf); Printf("Error on line %s:%d: expecting float, got \"%s\"\n",sf->filename,scriptfile_getlinum(sf,sf->ltextptr),p); return -2; } return 0; } int scriptfile_getsymbol(scriptfile *sf, int32_t *num) { char *t = scriptfile_gettoken(sf); if (!t) return -1; char * e; int32_t v = Bstrtol(t, &e, 10); if (*e) { // looks like a string, so find it in the symbol table if (scriptfile_getsymbolvalue(t, num)) return 0; Printf("Error on line %s:%d: expecting symbol, got \"%s\"\n", sf->filename, scriptfile_getlinum(sf, sf->ltextptr), t); return -2; } *num = v; return 0; } int32_t scriptfile_getbraces(scriptfile *sf, char **braceend) { if (scriptfile_eof_error(sf)) return -1; if (sf->textptr[0] != '{') { Printf("Error on line %s:%d: expecting '{'\n",sf->filename,scriptfile_getlinum(sf,sf->textptr)); return -1; } char *bracestart = ++sf->textptr; int bracecnt = 1; do { if (sf->textptr >= sf->eof) return 0; else if (sf->textptr[0] == '{') bracecnt++; else if (sf->textptr[0] == '}') if (!(--bracecnt)) break; sf->textptr++; } while (1); (*braceend) = sf->textptr; sf->textptr = bracestart; return 0; } int32_t scriptfile_getlinum(const scriptfile *sf, const char *ptr) { int32_t i, stp; intptr_t ind; //for(i=0;ilinenum;i++) if (sf->lineoffs[i] >= ind) return i+1; //brute force algo ind = ((intptr_t)ptr) - ((intptr_t)sf->textbuf); for (stp=1; stp+stplinenum; stp+=stp) { } //stp = highest power of 2 less than sf->linenum for (i=0; stp; stp>>=1) if ((i+stp-1 < sf->linenum) && (sf->lineoffs[i+stp-1] < ind)) i += stp; return i+1; //i = index to highest lineoffs which is less than ind; convert to 1-based line numbers } void scriptfile_preparse(scriptfile *sf, char *tx, int32_t flen) { int32_t i, cr, numcr, nflen, ws, cs, inquote; //Count number of lines numcr = 1; for (i=0; ilinenum = numcr; sf->lineoffs = (int32_t *)Xmalloc(sf->linenum*sizeof(int32_t)); //Preprocess file for comments (// and /*...*/, and convert all whitespace to single spaces) nflen = 0; ws = 0; cs = 0; numcr = 0; inquote = 0; for (i=0; ilineoffs[numcr++] = nflen; if (cs == 1) cs = 0; ws = 1; continue; //strip CR/LF } if ((!inquote) && ((tx[i] == ' ') || (tx[i] == '\t'))) { ws = 1; continue; } // strip Space/Tab if ((tx[i] == '/') && (tx[i + 1] == '/') && (!cs)) cs = 1; if ((tx[i] == '/') && (tx[i + 1] == '*') && (!cs)) { ws = 1; cs = 2; } if ((tx[i] == '*') && (tx[i + 1] == '/') && (cs == 2)) { cs = 0; i++; continue; } if (cs) continue; if (ws) tx[nflen++] = ws = 0; //quotes inside strings: \" if ((tx[i] == '\\') && (tx[i+1] == '\"')) { i++; tx[nflen++] = '\"'; continue; } if (tx[i] == '\"') { inquote ^= 1; continue; } tx[nflen++] = tx[i]; } tx[nflen++] = 0; sf->lineoffs[numcr] = nflen; tx[nflen++] = 0; #if 0 //for debugging only: printf("pre-parsed file:flen=%d,nflen=%d\n",flen,nflen); for (i=0; ilinenum); for (i=0; ilinenum; i++) printf("line %d = byte %d\n",i,sf->lineoffs[i]); #endif sf->textbuf = sf->textptr = tx; sf->textlength = nflen; sf->eof = &sf->textbuf[nflen-1]; } scriptfile *scriptfile_fromfile(const char *fn) { auto fr = fileSystem.OpenFileReader(fn); if (!fr.isOpen()) return nullptr; uint32_t flen = fr.GetLength(); char * tx = (char *)Xmalloc(flen + 2); scriptfile *sf = (scriptfile *)Xmalloc(sizeof(scriptfile)); fr.Read(tx, flen); tx[flen] = tx[flen+1] = 0; scriptfile_preparse(sf,tx,flen); sf->filename = Xstrdup(fn); return sf; } scriptfile *scriptfile_fromstring(const char *string) { if (!string) return nullptr; uint32_t flen = Bstrlen(string); char * tx = (char *)Xmalloc(flen + 2); scriptfile *sf = (scriptfile *)Xmalloc(sizeof(scriptfile)); Bmemcpy(tx, string, flen); tx[flen] = tx[flen+1] = 0; scriptfile_preparse(sf,tx,flen); sf->filename = NULL; return sf; } void scriptfile_close(scriptfile *sf) { if (!sf) return; Xfree(sf->lineoffs); Xfree(sf->textbuf); Xfree(sf->filename); Xfree(sf); } int scriptfile_eof(scriptfile *sf) { skipoverws(sf); return !!(sf->textptr >= sf->eof); } #define SYMBTABSTARTSIZE 256 static int32_t symbtablength=0, symbtaballoclength=0; static char *symbtab = NULL; static char *getsymbtabspace(int32_t reqd) { char *pos,*np; int32_t i; if (symbtablength + reqd > symbtaballoclength) { for (i=max(symbtaballoclength,SYMBTABSTARTSIZE); symbtablength+reqd>i; i<<=1) { } np = (char *)Xrealloc(symbtab, i); symbtab = np; symbtaballoclength = i; } pos = &symbtab[symbtablength]; symbtablength += reqd; return pos; } int32_t scriptfile_getsymbolvalue(char const *name, int32_t *val) { if (Bstrlen(name) > 2) { if (name[0] == '0' && tolower(name[1]) == 'x') // hex constants { uint64_t x; sscanf(name + 2, "%" PRIx64 "", &x); if (EDUKE32_PREDICT_FALSE(x > UINT32_MAX)) Printf("warning: number 0x%x" PRIx64 " truncated to 32 bits.\n", x); *val = x; return 1; } } char *scanner = symbtab; if (!symbtab) return 0; while (scanner - symbtab < symbtablength) { if (!Bstrcasecmp(name, scanner)) { *val = B_UNBUF32(scanner + strlen(scanner) + 1); return 1; } scanner += strlen(scanner) + 1 + sizeof(int32_t); } return 0; } int32_t scriptfile_addsymbolvalue(char const *name, int32_t val) { char *sp; // if (scriptfile_getsymbolvalue(name, &x)) return -1; // already exists if (symbtab) { char *scanner = symbtab; while (scanner - symbtab < symbtablength) { if (!Bstrcasecmp(name, scanner)) { B_BUF32(scanner + strlen(scanner) + 1, val); return 1; } scanner += strlen(scanner) + 1 + sizeof(int32_t); } } sp = getsymbtabspace(strlen(name) + 1 + sizeof(int32_t)); if (!sp) return 0; strcpy(sp, name); sp += strlen(name)+1; B_BUF32(sp, val); return 1; // added } void scriptfile_clearsymbols(void) { DO_FREE_AND_NULL(symbtab); symbtablength = 0; symbtaballoclength = 0; } int32_t getatoken(scriptfile *sf, const tokenlist *tl, int32_t ntokens) { char *tok; int32_t i; if (!sf) return T_ERROR; tok = scriptfile_gettoken(sf); if (!tok) return T_EOF; for (i=ntokens-1; i>=0; i--) { if (!Bstrcasecmp(tok, tl[i].text)) return tl[i].tokenid; } return T_ERROR; }