mirror of
https://github.com/DrBeef/JKXR.git
synced 2024-12-11 21:21:47 +00:00
581 lines
12 KiB
C
581 lines
12 KiB
C
|
/*
|
||
|
===========================================================================
|
||
|
Copyright (C) 2000 - 2013, Raven Software, Inc.
|
||
|
Copyright (C) 2001 - 2013, Activision, Inc.
|
||
|
Copyright (C) 2013 - 2015, OpenJK contributors
|
||
|
|
||
|
This file is part of the OpenJK source code.
|
||
|
|
||
|
OpenJK is free software; you can redistribute it and/or modify it
|
||
|
under the terms of the GNU General Public License version 2 as
|
||
|
published by the Free Software Foundation.
|
||
|
|
||
|
This program is distributed in the hope that it will be useful,
|
||
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
GNU General Public License for more details.
|
||
|
|
||
|
You should have received a copy of the GNU General Public License
|
||
|
along with this program; if not, see <http://www.gnu.org/licenses/>.
|
||
|
===========================================================================
|
||
|
*/
|
||
|
|
||
|
// Tokenizer.h
|
||
|
|
||
|
#ifndef __TOKENIZER_H
|
||
|
#define __TOKENIZER_H
|
||
|
|
||
|
#include <string>
|
||
|
#include <string.h>
|
||
|
#include <vector>
|
||
|
#include <map>
|
||
|
|
||
|
// Short aliases for the unsigned integer types used throughout the tokenizer.
typedef unsigned char byte;		// a single raw input character
typedef unsigned short word;
|
||
|
|
||
|
// Length limits; presumably the bounds behind TKERR_STRINGLENGTHEXCEEDED and
// TKERR_IDENTIFIERLENGTHEXCEEDED -- confirm against the implementation.
#define MAX_STRING_LENGTH		256
#define MAX_IDENTIFIER_LENGTH	128
|
||
|
|
||
|
// Tokenizer option flags. Each value is a distinct single bit so the flags can
// be OR-ed together into one unsigned mask.
// NOTE(review): flags without a trailing comment are not described in this
// header; see the tokenizer implementation for their exact effect.
#define TKF_IGNOREDIRECTIVES			0x00000001		// skip over lines starting with #
#define TKF_USES_EOL					0x00000002		// generate end of line tokens
#define TKF_NODIRECTIVES				0x00000004		// don't treat # in any special way
#define TKF_WANTUNDEFINED				0x00000008		// if token not found in symbols create undefined token
#define TKF_WIDEUNDEFINEDSYMBOLS		0x00000010		// when undefined token encountered, accumulate until space
#define TKF_RAWSYMBOLSONLY				0x00000020
#define TKF_NUMERICIDENTIFIERSTART		0x00000040
#define TKF_IGNOREKEYWORDS				0x00000080
#define TKF_NOCASEKEYWORDS				0x00000100
#define TKF_NOUNDERSCOREINIDENTIFIER	0x00000200
#define TKF_NODASHINIDENTIFIER			0x00000400
#define TKF_COMMENTTOKENS				0x00000800
|
||
|
|
||
|
// Tokenizer error codes. Values are sequential starting at TKERR_NONE == 0;
// TKERR_USERERROR is the last built-in code.
// NOTE(review): presumably caller-defined errors start at TKERR_USERERROR
// (see CTokenizer::SetAdditionalErrors) -- confirm against the implementation.
enum
{
	TKERR_NONE,
	TKERR_UNKNOWN,
	TKERR_BUFFERCREATE,
	TKERR_UNRECOGNIZEDSYMBOL,
	TKERR_DUPLICATESYMBOL,
	TKERR_STRINGLENGTHEXCEEDED,
	TKERR_IDENTIFIERLENGTHEXCEEDED,
	TKERR_EXPECTED_INTEGER,
	TKERR_EXPECTED_IDENTIFIER,
	TKERR_EXPECTED_STRING,
	TKERR_EXPECTED_CHAR,
	TKERR_EXPECTED_FLOAT,
	TKERR_UNEXPECTED_TOKEN,
	TKERR_INVALID_DIRECTIVE,
	TKERR_INCLUDE_FILE_NOTFOUND,
	TKERR_UNMATCHED_DIRECTIVE,
	TKERR_USERERROR,
};
|
||
|
|
||
|
// Built-in token type identifiers (the values returned by CToken::GetType()
// overrides are presumably drawn from this set -- confirm in the implementation).
// TK_EOF is -1, the remaining values count up from TK_UNDEFINED == 0, and
// TK_INTEGER is an alias for TK_INT.
enum
{
	TK_EOF = -1,
	TK_UNDEFINED,
	TK_COMMENT,
	TK_EOL,
	TK_CHAR,
	TK_STRING,
	TK_INT,
	TK_INTEGER = TK_INT,
	TK_FLOAT,
	TK_IDENTIFIER,
	TK_USERDEF,
};
|
||
|
|
||
|
// One entry of a keyword / symbol / error table: a text string paired with the
// integer value it maps to. Tables are passed around as keywordArray_t*.
// NOTE(review): how the end of a table is marked is not visible in this header.
typedef struct
{
	char*		m_keyword;		// the text
	int			m_tokenvalue;	// value associated with m_keyword
} keywordArray_t;
|
||
|
|
||
|
// Ordering functor for C strings: compares the characters pointed to (via
// strcmp) rather than the pointer values, so it can be used as the comparator
// of an ordered container keyed on const char*.
// Both arguments must be non-null, NUL-terminated strings (strcmp requirement).
class lessstr
{
public:
	// Returns true when str1 sorts strictly before str2.
	bool operator()(const char *str1, const char *str2) const
	{
		return strcmp(str1, str2) < 0;
	}
};
|
||
|
|
||
|
class CParseStream
|
||
|
{
|
||
|
public:
|
||
|
CParseStream();
|
||
|
~CParseStream();
|
||
|
static CParseStream* Create();
|
||
|
virtual void Delete();
|
||
|
virtual bool NextChar(byte& theByte);
|
||
|
virtual int GetCurLine();
|
||
|
virtual void GetCurFilename(char** theBuff);
|
||
|
virtual long GetRemainingSize();
|
||
|
|
||
|
CParseStream* GetNext();
|
||
|
void SetNext(CParseStream* next);
|
||
|
|
||
|
virtual bool IsThisDefinition(void* theDefinition);
|
||
|
|
||
|
protected:
|
||
|
bool InitBaseStream();
|
||
|
|
||
|
CParseStream* m_next;
|
||
|
};
|
||
|
|
||
|
// Base class for all tokens produced by the tokenizer. A token carries a
// string (m_string) and can be linked to a following token through m_next.
// Concrete token kinds derive from this class and override GetType() and,
// where relevant, the value accessors.
class CToken
{
public:
	CToken();
	// Virtual because this is a polymorphic base: destroying a derived token
	// through a CToken pointer must run the derived destructor.
	virtual ~CToken();
	static CToken* Create();
	virtual void Delete();

	virtual int GetType();
	CToken* GetNext();
	void SetNext(CToken* theToken);
	virtual int GetIntValue();
	virtual const char *GetStringValue();
	virtual float GetFloatValue();

protected:
	virtual void InitBaseToken();

	char*				m_string;	// token text
	CToken*				m_next;		// next token in the chain
};
|
||
|
|
||
|
class CCharToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CCharToken();
|
||
|
~CCharToken();
|
||
|
static CCharToken* Create(byte theByte);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
|
||
|
protected:
|
||
|
void Init(byte theByte);
|
||
|
};
|
||
|
|
||
|
class CStringToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CStringToken();
|
||
|
~CStringToken();
|
||
|
static CStringToken* Create(const char *theString);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
|
||
|
protected:
|
||
|
void Init(const char *theString);
|
||
|
};
|
||
|
|
||
|
class CIntToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CIntToken();
|
||
|
~CIntToken();
|
||
|
static CIntToken* Create(long value);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
virtual float GetFloatValue();
|
||
|
virtual int GetIntValue();
|
||
|
virtual const char *GetStringValue();
|
||
|
|
||
|
protected:
|
||
|
void Init(long value);
|
||
|
|
||
|
long m_value;
|
||
|
};
|
||
|
|
||
|
class CFloatToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CFloatToken();
|
||
|
~CFloatToken();
|
||
|
static CFloatToken* Create(float value);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
virtual float GetFloatValue();
|
||
|
virtual const char *GetStringValue();
|
||
|
|
||
|
protected:
|
||
|
virtual void Init(float value);
|
||
|
|
||
|
float m_value;
|
||
|
};
|
||
|
|
||
|
class CIdentifierToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CIdentifierToken();
|
||
|
~CIdentifierToken();
|
||
|
static CIdentifierToken* Create(const char *name);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
|
||
|
protected:
|
||
|
void Init(const char *name);
|
||
|
};
|
||
|
|
||
|
class CCommentToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CCommentToken();
|
||
|
~CCommentToken();
|
||
|
static CCommentToken* Create(const char *name);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
|
||
|
protected:
|
||
|
void Init(const char *name);
|
||
|
};
|
||
|
|
||
|
class CUserToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CUserToken();
|
||
|
~CUserToken();
|
||
|
static CUserToken* Create(int value, const char *string);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
|
||
|
protected:
|
||
|
void Init(int value, const char *string);
|
||
|
|
||
|
int m_value;
|
||
|
};
|
||
|
|
||
|
class CUndefinedToken : public CToken
|
||
|
{
|
||
|
public:
|
||
|
CUndefinedToken();
|
||
|
~CUndefinedToken();
|
||
|
static CUndefinedToken* Create(const char *string);
|
||
|
virtual void Delete();
|
||
|
|
||
|
virtual int GetType();
|
||
|
|
||
|
protected:
|
||
|
void Init(const char *string);
|
||
|
};
|
||
|
|
||
|
// Base class for named symbols. Holds the symbol name (m_symbolName) and
// exposes it through GetName(); derived classes add a value.
class CSymbol
{
public:
	CSymbol();
	virtual ~CSymbol();
	static CSymbol* Create(const char *symbolName);
	virtual void Delete();

	const char *GetName();

protected:
	void Init(const char *symbolName);

	char*			m_symbolName;	// name of the symbol
};
|
||
|
|
||
|
// Ordered map from a C-string key to a CSymbol*. Keys are compared by string
// content (lessstr), not by pointer value.
typedef std::map<const char *, CSymbol*, lessstr> symbolmap_t;
|
||
|
|
||
|
class CDirectiveSymbol : public CSymbol
|
||
|
{
|
||
|
public:
|
||
|
CDirectiveSymbol();
|
||
|
~CDirectiveSymbol();
|
||
|
static CDirectiveSymbol* Create(const char *symbolName);
|
||
|
virtual void Delete();
|
||
|
|
||
|
void SetValue(const char *value);
|
||
|
const char *GetValue();
|
||
|
|
||
|
protected:
|
||
|
void Init(const char *symbolName);
|
||
|
|
||
|
char* m_value;
|
||
|
};
|
||
|
|
||
|
class CIntSymbol : public CSymbol
|
||
|
{
|
||
|
public:
|
||
|
CIntSymbol();
|
||
|
static CIntSymbol* Create(const char *symbolName, int value);
|
||
|
virtual void Delete();
|
||
|
|
||
|
int GetValue();
|
||
|
|
||
|
protected:
|
||
|
void Init(const char *symbolName, int value);
|
||
|
|
||
|
int m_value;
|
||
|
};
|
||
|
|
||
|
class CSymbolTable
|
||
|
{
|
||
|
public:
|
||
|
CSymbolTable();
|
||
|
~CSymbolTable();
|
||
|
static CSymbolTable* Create();
|
||
|
void Delete();
|
||
|
|
||
|
bool AddSymbol(CSymbol* theSymbol);
|
||
|
CSymbol* FindSymbol(const char *symbolName);
|
||
|
CSymbol* ExtractSymbol(const char *symbolName);
|
||
|
void RemoveSymbol(const char *symbolName);
|
||
|
void DiscardSymbols();
|
||
|
|
||
|
protected:
|
||
|
void Init();
|
||
|
symbolmap_t m_symbols;
|
||
|
};
|
||
|
|
||
|
class CSymbolLookup
|
||
|
{
|
||
|
public:
|
||
|
CSymbolLookup();
|
||
|
~CSymbolLookup();
|
||
|
static CSymbolLookup* Create(byte theByte);
|
||
|
virtual void Delete();
|
||
|
CSymbolLookup* GetNext();
|
||
|
void SetNext(CSymbolLookup* next);
|
||
|
void SetParent(CSymbolLookup* parent);
|
||
|
CSymbolLookup* GetParent();
|
||
|
CSymbolLookup** GetChildAddress();
|
||
|
CSymbolLookup* GetChild();
|
||
|
void SetValue(int value);
|
||
|
int GetValue();
|
||
|
byte GetByte();
|
||
|
|
||
|
protected:
|
||
|
void Init(byte theByte);
|
||
|
|
||
|
CSymbolLookup* m_child;
|
||
|
CSymbolLookup* m_sibling;
|
||
|
CSymbolLookup* m_parent;
|
||
|
int m_value;
|
||
|
byte m_byte;
|
||
|
};
|
||
|
|
||
|
// One entry of the tokenizer's state list (linked through m_next). Tracks a
// skip flag (m_skip) and whether an else has been seen (m_elseHit).
// NOTE(review): presumably models nested conditional directives -- confirm
// in the implementation.
class CTokenizerState
{
public:
	CTokenizerState();
	// Virtual because this is a polymorphic base (CTokenizerHolderState
	// derives from it): destroying through a base pointer must run the
	// derived destructor.
	virtual ~CTokenizerState();
	static CTokenizerState* Create(bool skip);
	virtual void Delete();
	CTokenizerState* GetNext();
	void SetNext(CTokenizerState* next);
	virtual bool ProcessElse();
	bool Skipping();

protected:
	void Init(bool skip);

	bool				m_skip;
	bool				m_elseHit;
	CTokenizerState*	m_next;		// next state in the list
};
|
||
|
|
||
|
class CTokenizerHolderState : public CTokenizerState
|
||
|
{
|
||
|
public:
|
||
|
CTokenizerHolderState();
|
||
|
~CTokenizerHolderState();
|
||
|
static CTokenizerHolderState* Create();
|
||
|
virtual void Delete();
|
||
|
virtual bool ProcessElse();
|
||
|
|
||
|
protected:
|
||
|
void Init();
|
||
|
};
|
||
|
|
||
|
// Callback type for error reporting: receives the error text as a C string.
// Installed on a tokenizer with CTokenizer::SetErrorProc().
typedef void (*LPTokenizerErrorProc)(const char *errString);
|
||
|
|
||
|
#ifdef USES_MODULES
|
||
|
class CTokenizer : public CModule
|
||
|
#else
|
||
|
class CTokenizer
|
||
|
#endif
|
||
|
{
|
||
|
public:
|
||
|
CTokenizer();
|
||
|
~CTokenizer();
|
||
|
static CTokenizer* Create(unsigned dwFlags = 0);
|
||
|
virtual void Delete();
|
||
|
virtual void Error(int theError);
|
||
|
virtual void Error(int theError, const char *errString);
|
||
|
virtual void Error(const char *errString, int theError = TKERR_UNKNOWN);
|
||
|
|
||
|
CToken* GetToken(unsigned onFlags = 0, unsigned offFlags = 0);
|
||
|
CToken* GetToken(keywordArray_t* keywords, unsigned onFlags, unsigned offFlags);
|
||
|
void PutBackToken(CToken* theToken, bool commented = false, const char *addedChars = NULL, bool bIgnoreThisTokenType = false);
|
||
|
bool RequireToken(int tokenType);
|
||
|
void ScanUntilToken(int tokenType);
|
||
|
void SkipToLineEnd();
|
||
|
CToken* GetToEndOfLine(int tokenType = TK_IDENTIFIER);
|
||
|
|
||
|
keywordArray_t* SetKeywords(keywordArray_t* theKeywords);
|
||
|
void SetSymbols(keywordArray_t* theSymbols);
|
||
|
void SetAdditionalErrors(keywordArray_t* theErrors);
|
||
|
void SetErrorProc(LPTokenizerErrorProc errorProc);
|
||
|
void AddParseStream(byte* data, long datasize);
|
||
|
bool AddParseFile(const char *filename);
|
||
|
unsigned int ParseRGB();
|
||
|
long GetRemainingSize();
|
||
|
|
||
|
unsigned GetFlags();
|
||
|
void SetFlags(unsigned flags);
|
||
|
|
||
|
void GetCurFilename(char** filename);
|
||
|
int GetCurLine();
|
||
|
|
||
|
const char *LookupToken(int tokenID, keywordArray_t* theTable = NULL);
|
||
|
|
||
|
protected:
|
||
|
void SetError(int theError, const char *errString);
|
||
|
virtual void Init(unsigned dwFlags = 0);
|
||
|
CToken* FetchToken();
|
||
|
bool AddDefineSymbol(CDirectiveSymbol* definesymbol);
|
||
|
bool NextChar(byte& theByte);
|
||
|
byte Escapement();
|
||
|
void InsertSymbol(const char *theSymbol, int theValue);
|
||
|
void PutBackChar(byte theByte, int curLine = 0, const char *filename = NULL);
|
||
|
CToken* TokenFromName(const char *name);
|
||
|
CToken* HandleDirective();
|
||
|
CToken* HandleSlash();
|
||
|
CToken* HandleString();
|
||
|
CToken* HandleQuote();
|
||
|
CToken* HandleIdentifier(byte theByte);
|
||
|
CToken* HandleNumeric(byte theByte);
|
||
|
CToken* HandleFloat(bool thesign = false, long value = 0);
|
||
|
CToken* HandleDecimal(bool thesign = false);
|
||
|
CToken* HandleSymbol(byte theByte);
|
||
|
CToken* HandleHex(bool thesize);
|
||
|
CToken* HandleOctal(bool thesize);
|
||
|
int DirectiveFromName(const char *name);
|
||
|
|
||
|
CParseStream* m_curParseStream;
|
||
|
keywordArray_t* m_keywords;
|
||
|
keywordArray_t* m_symbols;
|
||
|
keywordArray_t* m_errors;
|
||
|
CSymbolLookup* m_symbolLookup;
|
||
|
CToken* m_nextToken;
|
||
|
CSymbolTable m_defines;
|
||
|
CTokenizerState* m_state;
|
||
|
unsigned m_flags;
|
||
|
LPTokenizerErrorProc m_errorProc;
|
||
|
|
||
|
static keywordArray_t errorMessages[];
|
||
|
static keywordArray_t directiveKeywords[];
|
||
|
};
|
||
|
|
||
|
class CKeywordTable
|
||
|
{
|
||
|
public:
|
||
|
CKeywordTable(CTokenizer* tokenizer, keywordArray_t* keywords);
|
||
|
~CKeywordTable();
|
||
|
|
||
|
protected:
|
||
|
CTokenizer* m_tokenizer;
|
||
|
keywordArray_t* m_holdKeywords;
|
||
|
};
|
||
|
|
||
|
class CParsePutBack : public CParseStream
|
||
|
{
|
||
|
public:
|
||
|
CParsePutBack();
|
||
|
~CParsePutBack();
|
||
|
static CParsePutBack* Create(byte theByte, int curLine, const char *filename);
|
||
|
virtual void Delete();
|
||
|
virtual bool NextChar(byte& theByte);
|
||
|
virtual int GetCurLine();
|
||
|
virtual void GetCurFilename(char** theBuff);
|
||
|
virtual long GetRemainingSize();
|
||
|
|
||
|
protected:
|
||
|
void Init(byte theByte, int curLine, const char *filename);
|
||
|
|
||
|
byte m_byte;
|
||
|
bool m_consumed;
|
||
|
int m_curLine;
|
||
|
char* m_curFile;
|
||
|
};
|
||
|
|
||
|
class CParseMemory : public CParseStream
|
||
|
{
|
||
|
public:
|
||
|
CParseMemory();
|
||
|
~CParseMemory();
|
||
|
static CParseMemory* Create(byte* data, long datasize);
|
||
|
virtual void Delete();
|
||
|
virtual bool NextChar(byte& theByte);
|
||
|
virtual int GetCurLine();
|
||
|
virtual void GetCurFilename(char** theBuff);
|
||
|
virtual long GetRemainingSize();
|
||
|
|
||
|
protected:
|
||
|
void Init(byte* data, long datasize);
|
||
|
|
||
|
byte* m_data;
|
||
|
int m_curLine;
|
||
|
long m_curPos;
|
||
|
long m_datasize;
|
||
|
long m_offset;
|
||
|
};
|
||
|
|
||
|
class CParseBlock : public CParseMemory
|
||
|
{
|
||
|
public:
|
||
|
CParseBlock();
|
||
|
~CParseBlock();
|
||
|
static CParseBlock* Create(byte* data, long datasize);
|
||
|
virtual void Delete();
|
||
|
|
||
|
protected:
|
||
|
virtual void Init(byte* data, long datasize);
|
||
|
};
|
||
|
|
||
|
class CParseToken : public CParseStream
|
||
|
{
|
||
|
public:
|
||
|
CParseToken();
|
||
|
~CParseToken();
|
||
|
static CParseToken* Create(CToken* token);
|
||
|
virtual void Delete();
|
||
|
virtual bool NextChar(byte& theByte);
|
||
|
virtual int GetCurLine();
|
||
|
virtual void GetCurFilename(char** theBuff);
|
||
|
virtual long GetRemainingSize();
|
||
|
|
||
|
protected:
|
||
|
void Init(CToken* token);
|
||
|
|
||
|
byte* m_data;
|
||
|
int m_curLine;
|
||
|
long m_curPos;
|
||
|
long m_datasize;
|
||
|
long m_offset;
|
||
|
};
|
||
|
|
||
|
class CParseDefine : public CParseMemory
|
||
|
{
|
||
|
public:
|
||
|
CParseDefine();
|
||
|
~CParseDefine();
|
||
|
static CParseDefine* Create(CDirectiveSymbol* definesymbol);
|
||
|
virtual void Delete();
|
||
|
virtual bool IsThisDefinition(void* theDefinition);
|
||
|
|
||
|
protected:
|
||
|
virtual void Init(CDirectiveSymbol* definesymbol);
|
||
|
|
||
|
CDirectiveSymbol* m_defineSymbol;
|
||
|
};
|
||
|
|
||
|
#endif//__TOKENIZER_H
|