mirror of
https://github.com/UberGames/GtkRadiant.git
synced 2024-11-27 06:02:29 +00:00
384 lines
7.6 KiB
C
384 lines
7.6 KiB
C
|
/*
|
||
|
Copyright (C) 2001-2006, William Joseph.
|
||
|
All Rights Reserved.
|
||
|
|
||
|
This file is part of GtkRadiant.
|
||
|
|
||
|
GtkRadiant is free software; you can redistribute it and/or modify
|
||
|
it under the terms of the GNU General Public License as published by
|
||
|
the Free Software Foundation; either version 2 of the License, or
|
||
|
(at your option) any later version.
|
||
|
|
||
|
GtkRadiant is distributed in the hope that it will be useful,
|
||
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
GNU General Public License for more details.
|
||
|
|
||
|
You should have received a copy of the GNU General Public License
|
||
|
along with GtkRadiant; if not, write to the Free Software
|
||
|
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
|
||
|
*/
|
||
|
|
||
|
#if !defined(INCLUDED_SCRIPT_SCRIPTTOKENISER_H)
|
||
|
#define INCLUDED_SCRIPT_SCRIPTTOKENISER_H
|
||
|
|
||
|
#include "iscriplib.h"
|
||
|
|
||
|
class ScriptTokeniser : public Tokeniser
|
||
|
{
|
||
|
enum CharType
|
||
|
{
|
||
|
eWhitespace,
|
||
|
eCharToken,
|
||
|
eNewline,
|
||
|
eCharQuote,
|
||
|
eCharSolidus,
|
||
|
eCharStar,
|
||
|
eCharSpecial,
|
||
|
};
|
||
|
|
||
|
typedef bool (ScriptTokeniser::*Tokenise)(char c);
|
||
|
|
||
|
Tokenise m_stack[3];
|
||
|
Tokenise* m_state;
|
||
|
SingleCharacterInputStream<TextInputStream> m_istream;
|
||
|
std::size_t m_scriptline;
|
||
|
std::size_t m_scriptcolumn;
|
||
|
|
||
|
char m_token[MAXTOKEN];
|
||
|
char* m_write;
|
||
|
|
||
|
char m_current;
|
||
|
bool m_eof;
|
||
|
bool m_crossline;
|
||
|
bool m_unget;
|
||
|
bool m_emit;
|
||
|
|
||
|
bool m_special;
|
||
|
|
||
|
CharType charType(const char c)
|
||
|
{
|
||
|
switch(c)
|
||
|
{
|
||
|
case '\n': return eNewline;
|
||
|
case '"': return eCharQuote;
|
||
|
case '/': return eCharSolidus;
|
||
|
case '*': return eCharStar;
|
||
|
case '{': case '(': case '}': case ')': case '[': case ']': case ',': case ':': return (m_special) ? eCharSpecial : eCharToken;
|
||
|
}
|
||
|
|
||
|
if(c > 32)
|
||
|
{
|
||
|
return eCharToken;
|
||
|
}
|
||
|
return eWhitespace;
|
||
|
}
|
||
|
|
||
|
Tokenise state()
|
||
|
{
|
||
|
return *m_state;
|
||
|
}
|
||
|
void push(Tokenise state)
|
||
|
{
|
||
|
ASSERT_MESSAGE(m_state != m_stack + 2, "token parser: illegal stack push");
|
||
|
*(++m_state) = state;
|
||
|
}
|
||
|
void pop()
|
||
|
{
|
||
|
ASSERT_MESSAGE(m_state != m_stack, "token parser: illegal stack pop");
|
||
|
--m_state;
|
||
|
}
|
||
|
void add(const char c)
|
||
|
{
|
||
|
if(m_write < m_token + MAXTOKEN - 1)
|
||
|
{
|
||
|
*m_write++ = c;
|
||
|
}
|
||
|
}
|
||
|
void remove()
|
||
|
{
|
||
|
ASSERT_MESSAGE(m_write > m_token, "no char to remove");
|
||
|
--m_write;
|
||
|
}
|
||
|
|
||
|
bool tokeniseDefault(char c)
|
||
|
{
|
||
|
switch(charType(c))
|
||
|
{
|
||
|
case eNewline:
|
||
|
if(!m_crossline)
|
||
|
{
|
||
|
globalErrorStream() << Unsigned(getLine()) << ":" << Unsigned(getColumn()) << ": unexpected end-of-line before token\n";
|
||
|
return false;
|
||
|
}
|
||
|
break;
|
||
|
case eCharToken:
|
||
|
case eCharStar:
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseToken));
|
||
|
add(c);
|
||
|
break;
|
||
|
case eCharSpecial:
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseSpecial));
|
||
|
add(c);
|
||
|
break;
|
||
|
case eCharQuote:
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseQuotedToken));
|
||
|
break;
|
||
|
case eCharSolidus:
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseSolidus));
|
||
|
break;
|
||
|
default:
|
||
|
break;
|
||
|
}
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseToken(char c)
|
||
|
{
|
||
|
switch(charType(c))
|
||
|
{
|
||
|
case eNewline:
|
||
|
case eWhitespace:
|
||
|
case eCharQuote:
|
||
|
case eCharSpecial:
|
||
|
pop();
|
||
|
m_emit = true; // emit token
|
||
|
break;
|
||
|
case eCharSolidus:
|
||
|
#if 0 //SPoG: ignore comments in the middle of tokens.
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseSolidus));
|
||
|
break;
|
||
|
#endif
|
||
|
case eCharToken:
|
||
|
case eCharStar:
|
||
|
add(c);
|
||
|
break;
|
||
|
default:
|
||
|
break;
|
||
|
}
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseQuotedToken(char c)
|
||
|
{
|
||
|
switch(charType(c))
|
||
|
{
|
||
|
case eNewline:
|
||
|
if(m_crossline)
|
||
|
{
|
||
|
globalErrorStream() << Unsigned(getLine()) << ":" << Unsigned(getColumn()) << ": unexpected end-of-line in quoted token\n";
|
||
|
return false;
|
||
|
}
|
||
|
break;
|
||
|
case eWhitespace:
|
||
|
case eCharToken:
|
||
|
case eCharSolidus:
|
||
|
case eCharStar:
|
||
|
case eCharSpecial:
|
||
|
add(c);
|
||
|
break;
|
||
|
case eCharQuote:
|
||
|
pop();
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseEndQuote));
|
||
|
break;
|
||
|
default:
|
||
|
break;
|
||
|
}
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseSolidus(char c)
|
||
|
{
|
||
|
switch(charType(c))
|
||
|
{
|
||
|
case eNewline:
|
||
|
case eWhitespace:
|
||
|
case eCharQuote:
|
||
|
case eCharSpecial:
|
||
|
pop();
|
||
|
add('/');
|
||
|
m_emit = true; // emit single slash
|
||
|
break;
|
||
|
case eCharToken:
|
||
|
pop();
|
||
|
add('/');
|
||
|
add(c);
|
||
|
break;
|
||
|
case eCharSolidus:
|
||
|
pop();
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseComment));
|
||
|
break; // dont emit single slash
|
||
|
case eCharStar:
|
||
|
pop();
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseBlockComment));
|
||
|
break; // dont emit single slash
|
||
|
default:
|
||
|
break;
|
||
|
}
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseComment(char c)
|
||
|
{
|
||
|
if(c == '\n')
|
||
|
{
|
||
|
pop();
|
||
|
if(state() == Tokenise(&ScriptTokeniser::tokeniseToken))
|
||
|
{
|
||
|
pop();
|
||
|
m_emit = true; // emit token immediatly preceding comment
|
||
|
}
|
||
|
}
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseBlockComment(char c)
|
||
|
{
|
||
|
if(c == '*')
|
||
|
{
|
||
|
pop();
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseEndBlockComment));
|
||
|
}
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseEndBlockComment(char c)
|
||
|
{
|
||
|
switch(c)
|
||
|
{
|
||
|
case '/':
|
||
|
pop();
|
||
|
if(state() == Tokenise(&ScriptTokeniser::tokeniseToken))
|
||
|
{
|
||
|
pop();
|
||
|
m_emit = true; // emit token immediatly preceding comment
|
||
|
}
|
||
|
break; // dont emit comment
|
||
|
case '*':
|
||
|
break; // no state change
|
||
|
default:
|
||
|
pop();
|
||
|
push(Tokenise(&ScriptTokeniser::tokeniseBlockComment));
|
||
|
break;
|
||
|
}
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseEndQuote(char c)
|
||
|
{
|
||
|
pop();
|
||
|
m_emit = true; // emit quoted token
|
||
|
return true;
|
||
|
}
|
||
|
bool tokeniseSpecial(char c)
|
||
|
{
|
||
|
pop();
|
||
|
m_emit = true; // emit single-character token
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
/// Returns true if a token was successfully parsed.
|
||
|
bool tokenise()
|
||
|
{
|
||
|
m_write = m_token;
|
||
|
while(!eof())
|
||
|
{
|
||
|
char c = m_current;
|
||
|
|
||
|
if(!((*this).*state())(c))
|
||
|
{
|
||
|
// parse error
|
||
|
m_eof = true;
|
||
|
return false;
|
||
|
}
|
||
|
if(m_emit)
|
||
|
{
|
||
|
m_emit = false;
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
if(c == '\n')
|
||
|
{
|
||
|
++m_scriptline;
|
||
|
m_scriptcolumn = 1;
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
++m_scriptcolumn;
|
||
|
}
|
||
|
|
||
|
m_eof = !m_istream.readChar(m_current);
|
||
|
}
|
||
|
return m_write != m_token;
|
||
|
}
|
||
|
|
||
|
const char* fillToken()
|
||
|
{
|
||
|
if(!tokenise())
|
||
|
{
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
add('\0');
|
||
|
return m_token;
|
||
|
}
|
||
|
|
||
|
bool eof()
|
||
|
{
|
||
|
return m_eof;
|
||
|
}
|
||
|
|
||
|
public:
|
||
|
ScriptTokeniser(TextInputStream& istream, bool special)
|
||
|
: m_state(m_stack),
|
||
|
m_istream(istream),
|
||
|
m_scriptline(1),
|
||
|
m_scriptcolumn(1),
|
||
|
m_crossline(false),
|
||
|
m_unget(false),
|
||
|
m_emit(false),
|
||
|
m_special(special)
|
||
|
{
|
||
|
m_stack[0] = Tokenise(&ScriptTokeniser::tokeniseDefault);
|
||
|
m_eof = !m_istream.readChar(m_current);
|
||
|
m_token[MAXTOKEN - 1] = '\0';
|
||
|
}
|
||
|
void release()
|
||
|
{
|
||
|
delete this;
|
||
|
}
|
||
|
void nextLine()
|
||
|
{
|
||
|
m_crossline = true;
|
||
|
}
|
||
|
const char* getToken()
|
||
|
{
|
||
|
if(m_unget)
|
||
|
{
|
||
|
m_unget = false;
|
||
|
return m_token;
|
||
|
}
|
||
|
|
||
|
return fillToken();
|
||
|
}
|
||
|
void ungetToken()
|
||
|
{
|
||
|
ASSERT_MESSAGE(!m_unget, "can't unget more than one token");
|
||
|
m_unget = true;
|
||
|
}
|
||
|
std::size_t getLine() const
|
||
|
{
|
||
|
return m_scriptline;
|
||
|
}
|
||
|
std::size_t getColumn() const
|
||
|
{
|
||
|
return m_scriptcolumn;
|
||
|
}
|
||
|
};
|
||
|
|
||
|
|
||
|
inline Tokeniser& NewScriptTokeniser(TextInputStream& istream)
|
||
|
{
|
||
|
return *(new ScriptTokeniser(istream, true));
|
||
|
}
|
||
|
|
||
|
inline Tokeniser& NewSimpleTokeniser(TextInputStream& istream)
|
||
|
{
|
||
|
return *(new ScriptTokeniser(istream, false));
|
||
|
}
|
||
|
|
||
|
#endif
|