/*
-----------------------------------------------------------------------------
This source file is part of OGRE
(Object-oriented Graphics Rendering Engine)
For the latest info, see http://www.stevestreeting.com/ogre/

Copyright (c) 2000-2005 The OGRE Team
Also see acknowledgements in Readme.html

This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
Foundation; either version 2 of the License, or (at your option) any later
version.

This program is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.

You should have received a copy of the GNU General Public License along with
this program; if not, write to the Free Software Foundation, Inc., 59 Temple
Place - Suite 330, Boston, MA 02111-1307, USA, or go to
http://www.gnu.org/copyleft/gpl.html.
-----------------------------------------------------------------------------
*/
#include "OgreStableHeaders.h"
#include "OgreCompiler2Pass.h"
#include "OgreLogManager.h"
#include "OgreException.h"
#include "OgreStringConverter.h"

namespace Ogre {
    //-----------------------------------------------------------------------
    // instantiate static members
    Compiler2Pass::TokenState Compiler2Pass::mBNFTokenState;
    Compiler2Pass::TokenStateContainer Compiler2Pass::mClientTokenStates;
    //-----------------------------------------------------------------------
    Compiler2Pass::Compiler2Pass()
        : mActiveTokenState(&mBNFTokenState)
        , mSource(0)
        , mSourceName("system")
    {
        // reserve some memory space in the containers being used
        mBNFTokenState.tokenQue.reserve(100);
        mBNFTokenState.lexemeTokenDefinitions.reserve(50);

        initBNFCompiler();
    }
    //-----------------------------------------------------------------------
    void Compiler2Pass::initBNFCompiler(void)
    {
        if (mBNFTokenState.lexemeTokenDefinitions.empty())
        {
            addLexemeToken("UNKNOWN", BNF_UNKOWN);
            addLexemeToken("syntax", BNF_SYNTAX);
            addLexemeToken("rule", BNF_RULE);
            addLexemeToken("identifier", BNF_IDENTIFIER);
            addLexemeToken("identifier_right", BNF_IDENTIFIER_RIGHT);
            addLexemeToken("identifier_characters", BNF_IDENTIFIER_CHARACTERS);
            addLexemeToken("<", BNF_ID_BEGIN, false, true);
            addLexemeToken(">", BNF_ID_END, false, true);
            addLexemeToken("<#", BNF_CONSTANT_BEGIN, false, true);
            addLexemeToken("::=", BNF_SET_RULE, false, true);
            addLexemeToken("expression", BNF_EXPRESSION);
            addLexemeToken("and_term", BNF_AND_TERM);
            addLexemeToken("or_term", BNF_OR_TERM);
            addLexemeToken("term", BNF_TERM);
            addLexemeToken("term_id", BNF_TERM_ID);
            addLexemeToken("constant", BNF_CONSTANT);
            addLexemeToken("|", BNF_OR, false, true);
            addLexemeToken("terminal_symbol", BNF_TERMINAL_SYMBOL);
            addLexemeToken("terminal_start", BNF_TERMINAL_START);
            addLexemeToken("repeat_expression", BNF_REPEAT_EXPRESSION);
            addLexemeToken("not_expression", BNF_NOT_EXPRESSION);
            addLexemeToken("{", BNF_REPEAT_BEGIN, false, true);
            addLexemeToken("}", BNF_REPEAT_END, false, true);
            addLexemeToken("set", BNF_SET);
            addLexemeToken("(", BNF_SET_BEGIN, false, true);
            addLexemeToken(")", BNF_SET_END, false, true);
            addLexemeToken("set_end_exc", BNF_SET_END_EXC);
            addLexemeToken("optional_expression", BNF_OPTIONAL_EXPRESSION);
            addLexemeToken("[", BNF_OPTIONAL_BEGIN, false, true);
            addLexemeToken("]", BNF_OPTIONAL_END, false, true);
            addLexemeToken("not_test", BNF_NOT_TEST);
            addLexemeToken("not_chk", BNF_NOT_CHK);
            addLexemeToken("(?!", BNF_NOT_TEST_BEGIN, false, true);
            addLexemeToken("'", BNF_SINGLEQUOTE, false, true);
            addLexemeToken("-'", BNF_NO_TOKEN_START, false, true);
            addLexemeToken("any_character", BNF_ANY_CHARACTER);
            addLexemeToken("single_quote_exc", BNF_SINGLE_QUOTE_EXC);
            addLexemeToken("white_space_chk", BNF_WHITE_SPACE_CHK);
            addLexemeToken("special_characters1", BNF_SPECIAL_CHARACTERS1);
            addLexemeToken("special_characters2", BNF_SPECIAL_CHARACTERS2);

            addLexemeToken("letter", BNF_LETTER);
            addLexemeToken("letter_digit", BNF_LETTER_DIGIT);
            addLexemeToken("digit", BNF_DIGIT);
            addLexemeToken("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ", BNF_ALPHA_SET, false, true);
            addLexemeToken("0123456789", BNF_NUMBER_SET, false, true);
            addLexemeToken("`~!@#$%^&*(-_=+\\|[]{}:;\"<>,.?/", BNF_SPECIAL_CHARACTER_SET2, false, true);
            addLexemeToken("$_", BNF_SPECIAL_CHARACTER_SET1, false, true);
            addLexemeToken(" ", BNF_WHITE_SPACE, false, true);
            addLexemeToken("?!", BNF_NOT_CHARS, false, true);
        }

        if (mBNFTokenState.rootRulePath.empty())
        {
            // first entry is set to unknown in order to trap rule IDs not set for non-terminal tokens
            mBNFTokenState.rootRulePath.resize(1);
            // used by bootstrap BNF text parser
            // <>  - non-terminal token
            // ()  - set of
            // ::= - rule definition
            #define _rule_(id)     mBNFTokenState.rootRulePath.push_back(TokenRule(otRULE, id));
            #define _is_(id)       mBNFTokenState.rootRulePath.push_back(TokenRule(otAND, id));
            // - blank space is an implied "AND" meaning the token is required
            #define _and_(id)      mBNFTokenState.rootRulePath.push_back(TokenRule(otAND, id));
            // | - or
            #define _or_(id)       mBNFTokenState.rootRulePath.push_back(TokenRule(otOR, id));
            // [] - optional
            #define _optional_(id) mBNFTokenState.rootRulePath.push_back(TokenRule(otOPTIONAL, id));
            // {} - repeat 0 or more times until fail or rule does not progress
            #define _repeat_(id)   mBNFTokenState.rootRulePath.push_back(TokenRule(otREPEAT, id));
            #define _data_(id)     mBNFTokenState.rootRulePath.push_back(TokenRule(otDATA, id));
            // (?! ) - lookahead negative (not test)
            #define _not_(id)      mBNFTokenState.rootRulePath.push_back(TokenRule(otNOT_TEST, id));
            #define _end_          mBNFTokenState.rootRulePath.push_back(TokenRule(otEND, 0));

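            // For example, the rule "<rule> ::= <identifier> '::=' <expression>" below
            // expands through these macros into a flat sequence of TokenRule entries
            // appended to rootRulePath:
            //   (otRULE, BNF_RULE) (otAND, BNF_IDENTIFIER) (otAND, BNF_SET_RULE)
            //   (otAND, BNF_EXPRESSION) (otEND, 0)
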
            // <syntax> ::= { rule }
            _rule_(BNF_SYNTAX) _repeat_(BNF_RULE) _end_

            // <rule> ::= <identifier> "::=" <expression>
            _rule_(BNF_RULE)
                _is_(BNF_IDENTIFIER)
                _and_(BNF_SET_RULE)
                _and_(BNF_EXPRESSION)
            _end_

            // <expression> ::= <and_term> { <or_term> }
            _rule_(BNF_EXPRESSION)
                _is_(BNF_AND_TERM)
                _repeat_(BNF_OR_TERM)
            _end_
            // <or_term> ::= "|" <and_term>
            _rule_(BNF_OR_TERM)
                _is_(BNF_OR)
                _and_(BNF_AND_TERM)
            _end_
            // <and_term> ::= <term> { <term> }
            _rule_(BNF_AND_TERM)
                _is_(BNF_TERM)
                _repeat_(BNF_TERM)
            _end_
            // <term> ::= <term_id> | <repeat_expression> | <optional_expression> | <not_expression>
            _rule_(BNF_TERM)
                _is_(BNF_TERM_ID)
                _or_(BNF_REPEAT_EXPRESSION)
                _or_(BNF_OPTIONAL_EXPRESSION)
                _or_(BNF_NOT_EXPRESSION)
            _end_

            // <term_id> ::= <constant> | <identifier_right> | <terminal_symbol> | <set>
            _rule_(BNF_TERM_ID)
                _is_(BNF_CONSTANT)
                _or_(BNF_IDENTIFIER_RIGHT)
                _or_(BNF_TERMINAL_SYMBOL)
                _or_(BNF_SET)
            _end_

            // <repeat_expression> ::= "{" <term_id> "}"
            _rule_(BNF_REPEAT_EXPRESSION)
                _is_(BNF_REPEAT_BEGIN)
                _and_(BNF_TERM_ID)
                _and_(BNF_REPEAT_END)
            _end_

            // <optional_expression> ::= "[" <term_id> "]"
            _rule_(BNF_OPTIONAL_EXPRESSION)
                _is_(BNF_OPTIONAL_BEGIN)
                _and_(BNF_TERM_ID)
                _and_(BNF_OPTIONAL_END)
            _end_

            // <not_expression> ::= "(?!" <term_id> ")"
            _rule_(BNF_NOT_EXPRESSION)
                _is_(BNF_NOT_TEST_BEGIN)
                _and_(BNF_TERM_ID)
                _and_(BNF_SET_END)
            _end_

            // <identifier_right> ::= <identifier> (?!"::=")
            _rule_(BNF_IDENTIFIER_RIGHT)
                _is_(BNF_IDENTIFIER)
                _not_(BNF_SET_RULE)
            _end_

            // <identifier> ::= "<" <letter> {<identifier_characters>} ">"
            _rule_(BNF_IDENTIFIER)
                _is_(BNF_ID_BEGIN)
                _and_(BNF_LETTER)
                _repeat_(BNF_IDENTIFIER_CHARACTERS)
                _and_(BNF_ID_END)
            _end_

            // <identifier_characters> ::= <letter_digit> | <special_characters1>
            _rule_(BNF_IDENTIFIER_CHARACTERS)
                _is_(BNF_LETTER_DIGIT)
                _or_(BNF_SPECIAL_CHARACTERS1)
            _end_

            // <terminal_symbol> ::= <terminal_start> @{ <any_character> } "'"
            _rule_(BNF_TERMINAL_SYMBOL)
                _is_(BNF_TERMINAL_START)
                _and_(_no_space_skip_)
                _repeat_(BNF_ANY_CHARACTER)
                _and_(BNF_SINGLEQUOTE)
            _end_

            // <terminal_start> ::= "-'" | "'"
            _rule_(BNF_TERMINAL_START)
                _is_(BNF_NO_TOKEN_START)
                _or_(BNF_SINGLEQUOTE)
            _end_

            // <constant> ::= "<#" <letter> {<identifier_characters>} ">"
            _rule_(BNF_CONSTANT)
                _is_(BNF_CONSTANT_BEGIN)
                _and_(BNF_LETTER)
                _repeat_(BNF_IDENTIFIER_CHARACTERS)
                _and_(BNF_ID_END)
            _end_

            // <set> ::= "(" (?!<not_chk>) @{<any_character>} ")"
            _rule_(BNF_SET)
                _is_(BNF_SET_BEGIN)
                _not_(BNF_NOT_CHK)
                _and_(_no_space_skip_)
                _repeat_(BNF_ANY_CHARACTER)
                _and_(BNF_SET_END)
            _end_

            // <any_character> ::= <letter_digit> | <special_characters2>
            _rule_(BNF_ANY_CHARACTER)
                _is_(BNF_LETTER_DIGIT)
                _or_(BNF_SPECIAL_CHARACTERS2)
            _end_

            // <letter_digit> ::= <letter> | <digit>
            _rule_(BNF_LETTER_DIGIT)
                _is_(BNF_LETTER)
                _or_(BNF_DIGIT)
            _end_

            // <letter> ::= (abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ)
            _rule_(BNF_LETTER)
                _is_(_character_)
                _data_(BNF_ALPHA_SET) // "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ"
            _end_

            // <digit> ::= (0123456789)
            _rule_(BNF_DIGIT)
                _is_(_character_)
                _data_(BNF_NUMBER_SET)
            _end_

            // <special_characters1> ::= ($_)
            _rule_(BNF_SPECIAL_CHARACTERS1)
                _is_(_character_)
                _data_(BNF_SPECIAL_CHARACTER_SET1)
            _end_

            // <special_characters2> ::= (`~!@#$%^&*(-_=+\|[]{}:;"<>,.?/) | <single_quote_exc>
            //                           | <white_space_chk> | <set_end_exc>
            _rule_(BNF_SPECIAL_CHARACTERS2)
                _is_(_character_)
                _data_(BNF_SPECIAL_CHARACTER_SET2)
                _or_(BNF_WHITE_SPACE_CHK)
                _or_(BNF_SINGLE_QUOTE_EXC)
                _or_(BNF_SET_END_EXC)
            _end_

            // <single_quote_exc> ::= "'" (?!" ")
            _rule_(BNF_SINGLE_QUOTE_EXC)
                _is_(_character_)
                _data_(BNF_SINGLEQUOTE)
                _not_(BNF_WHITE_SPACE_CHK)
            _end_

            // <set_end_exc> ::= ")" (?!" ")
            _rule_(BNF_SET_END_EXC)
                _is_(_character_)
                _data_(BNF_SET_END)
                _not_(BNF_WHITE_SPACE_CHK)
            _end_

            // <white_space_chk> ::= ( )
            _rule_(BNF_WHITE_SPACE_CHK)
                _is_(_character_)
                _data_(BNF_WHITE_SPACE)
            _end_
            // <not_chk> ::= (?!)
            _rule_(BNF_NOT_CHK)
                _is_(_character_)
                _data_(BNF_NOT_CHARS)
            _end_

            // now that all the rules are added, update token definitions with rule links
            verifyTokenRuleLinks("system");
        }
        // switch to client state
        mActiveTokenState = mClientTokenState;
    }

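    // The hand-built rule paths above form the bootstrap grammar: in
    // setClientBNFGrammer() below, the client's BNF text is parsed with this
    // grammar (pass 1), and buildClientBNFRulePaths() then converts the
    // resulting token que into the client's own rule paths.
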
    //-----------------------------------------------------------------------
    void Compiler2Pass::verifyTokenRuleLinks(const String& grammerName)
    {
        size_t token_ID;

        // scan through all the rules and initialize index to rules for non-terminal tokens
        const size_t ruleCount = mActiveTokenState->rootRulePath.size();
        for (size_t i = 0; i < ruleCount; ++i)
        {
            // make sure token definition holds valid token
            if (mActiveTokenState->rootRulePath[i].operation == otRULE)
            {
                token_ID = mActiveTokenState->rootRulePath[i].tokenID;
                // system token IDs can never have a rule assigned to them so no need to check if token is a system token
                // but do make sure the ID is within defined bounds
                if (token_ID >= mActiveTokenState->lexemeTokenDefinitions.size())
                    OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR, "For grammar: " + grammerName +
                        ", a token ID was out of token definition range.",
                        "Compiler2Pass::verifyTokenRuleLinks");

                LexemeTokenDef& tokenDef = mActiveTokenState->lexemeTokenDefinitions[token_ID];
                if (tokenDef.ID != token_ID)
                    OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR, "For grammar: " + grammerName +
                        ", lexeme non-terminal token definition: " +
                        tokenDef.lexeme + " is corrupted and does not match its assigned rule.",
                        "Compiler2Pass::verifyTokenRuleLinks");
                // if operation is a rule then update token definition
                tokenDef.ruleID = i;
                tokenDef.isNonTerminal = true;
            }
        } // end for

        // test all non-terminals for valid rule ID
        const size_t definitionCount = mActiveTokenState->lexemeTokenDefinitions.size();
        bool errorsFound = false;
        // report all non-terminals that don't have a rule then throw an exception
        for (token_ID = 0; token_ID < definitionCount; ++token_ID)
        {
            const LexemeTokenDef& tokenDef = mActiveTokenState->lexemeTokenDefinitions[token_ID];
            if (tokenDef.isNonTerminal && (tokenDef.ruleID == 0))
            {
                errorsFound = true;
                LogManager::getSingleton().logMessage(
                    "For grammar: " + grammerName +
                    ", lexeme non-terminal token definition: " + tokenDef.lexeme +
                    " found with no rule definition or corrupted."
                    );
            }
        }
        if (errorsFound)
        {
            OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR, "For grammar: " + grammerName +
                ", lexeme non-terminal token definition(s) found with no rule definition or corrupted.",
                "Compiler2Pass::verifyTokenRuleLinks");
        }
    }

    //-----------------------------------------------------------------------
    bool Compiler2Pass::compile(const String& source, const String& sourceName)
    {
        // make sure BNF compiler is set up to compile BNF grammar if required
        initBNFCompiler();
        // compile the client's BNF grammar
        setClientBNFGrammer();

        bool Passed = false;

        mSource = &source;
        mSourceName = sourceName;
        mActiveTokenState = mClientTokenState;
        // start compiling if there is a rule base to work with
        if (mActiveTokenState->rootRulePath.size() > 1)
        {
            Passed = doPass1();

            if (Passed)
            {
                Passed = doPass2();
            }
        }

        return Passed;
    }

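    // Illustrative use (a sketch, not part of this file): a concrete script
    // compiler derives from Compiler2Pass, implements the virtual hooks this
    // file calls (setupTokenDefinitions, getClientBNFGrammer,
    // getClientGrammerName, executeTokenAction, ...), and then simply calls
    // compile() with the script text and a name used in error reports, e.g.:
    //   MyScriptCompiler compiler;                 // hypothetical subclass
    //   bool ok = compiler.compile(scriptText, "example.script");
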
    //-----------------------------------------------------------------------
    bool Compiler2Pass::doPass1()
    {
        // scan through Source string and build a token list using TokenInstructions
        // this is a simple brute force lexical scanner/analyzer that also parses the formed
        // token for proper semantics and context in one pass

        mCurrentLine = 1;
        mCharPos = 0;
        // reset position in Constants container
        mConstants.clear();
        mLabels.clear();
        // there is no active label when first starting pass 1
        mLabelIsActive = false;
        mActiveLabelKey = 0;
        mEndOfSource = mSource->length();

        // start with a clean slate
        mActiveTokenState->tokenQue.clear();
        mPass2TokenQuePosition = 0;
        mPreviousActionQuePosition = 0;
        mNoTerminalToken = false;
        mNoSpaceSkip = false;
        // tokenize and check semantics until an error occurs or end of source is reached
        // assume RootRulePath has pointer to rules so start at index + 1 for first rule path
        // first rule token would be a rule definition so skip over it
        bool passed = false;

        try
        {
            passed = processRulePath(1);
            // if a lexeme in source still exists then the end of source was not reached and there was a problem somewhere
            if (positionToNextLexeme()) passed = false;
            if (passed)
            {
                // special condition at end of script. The last action needs to be triggered if
                // parsing reached the end of the source.
                activatePreviousTokenAction();
            }

        }
        catch (Exception& e)
        {
            LogManager::getSingleton().logMessage( "Exception caught: "
                + e.getFullDescription()
                + ", while trying to parse: "
                + getClientGrammerName()
                + ": "
                + mSourceName
                );
        }
        catch (...)
        {
            LogManager::getSingleton().logMessage( "Unknown exception while trying to parse: "
                + getClientGrammerName()
                + ": "
                + mSourceName
                );
        }

        return passed;
    }

    //-----------------------------------------------------------------------
    bool Compiler2Pass::doPass2()
    {
        bool passed = true;
        // step through tokens container and execute until end found or error occurs

        return passed;
    }

    //-----------------------------------------------------------------------
    const Compiler2Pass::TokenInst& Compiler2Pass::getNextToken(const size_t expectedTokenID)
    {
        //static TokenInst badToken;
        // advance instruction que index by one then get the current token instruction
        if (mPass2TokenQuePosition < mActiveTokenState->tokenQue.size() - 1)
        {
            ++mPass2TokenQuePosition;
            const TokenInst& tokenInst = mActiveTokenState->tokenQue[mPass2TokenQuePosition];
            if (expectedTokenID > 0 && (tokenInst.tokenID != expectedTokenID))
            {
                OGRE_EXCEPT(Exception::ERR_ITEM_NOT_FOUND, getClientGrammerName() + ":" + mSourceName
                    + ", expected token ID not found",
                    "Compiler2Pass::getNextToken");
            }

            return tokenInst;
        }
        else
            // no more tokens left for pass 2 processing
            OGRE_EXCEPT(Exception::ERR_ITEM_NOT_FOUND, getClientGrammerName() + ":" + mSourceName
                + ", no more tokens available for pass 2 processing",
                "Compiler2Pass::getNextToken");
    }
    //-----------------------------------------------------------------------
    const Compiler2Pass::TokenInst& Compiler2Pass::getCurrentToken(void)
    {
        if (mPass2TokenQuePosition < mActiveTokenState->tokenQue.size() - 1)
            return mActiveTokenState->tokenQue[mPass2TokenQuePosition];
        else
            OGRE_EXCEPT(Exception::ERR_ITEM_NOT_FOUND, getClientGrammerName() + ":" + mSourceName
                + ", no token available, all pass 2 tokens processed",
                "Compiler2Pass::getCurrentToken");
    }
    //-----------------------------------------------------------------------
    bool Compiler2Pass::testNextTokenID(const size_t expectedTokenID)
    {
        bool passed = false;
        const size_t nextTokenIndex = mPass2TokenQuePosition + 1;
        if (nextTokenIndex < mActiveTokenState->tokenQue.size() - 1)
            passed = mActiveTokenState->tokenQue[nextTokenIndex].tokenID == expectedTokenID;

        return passed;
    }
    //-----------------------------------------------------------------------
    void Compiler2Pass::replaceToken(void)
    {
        // move instruction que index back one position
        if (mPass2TokenQuePosition > 0)
            --mPass2TokenQuePosition;
    }
    //-----------------------------------------------------------------------
    float Compiler2Pass::getNextTokenValue(void)
    {
        // get float value from current token instruction
        if (getNextToken().tokenID == _value_)
            return mConstants[mPass2TokenQuePosition];
        else
        {
            const TokenInst& token = getCurrentToken();
            // if token is not for a value then throw an exception
            OGRE_EXCEPT(Exception::ERR_ITEM_NOT_FOUND, "In " + mSourceName +
                ", Line " + StringConverter::toString(token.line) +
                ", token is not for a value. Found: >>>" + mSource->substr(token.pos, 20) +
                "<<<",
                "Compiler2Pass::getNextTokenValue");
        }
    }
    //-----------------------------------------------------------------------
    const String& Compiler2Pass::getNextTokenLabel(void)
    {
        // get label from current token instruction
        if (getNextToken().tokenID == _character_)
            return mLabels[mPass2TokenQuePosition];
        else
        {
            const TokenInst& token = getCurrentToken();
            // if token is not for a label then throw an exception
            OGRE_EXCEPT(Exception::ERR_ITEM_NOT_FOUND, "In " + mSourceName +
                ", Line " + StringConverter::toString(token.line) +
                ", token is not for a label. Found: >>>" + mSource->substr(token.pos, 20) +
                "<<<",
                "Compiler2Pass::getNextTokenLabel");
        }
    }
    //-----------------------------------------------------------------------
    size_t Compiler2Pass::getPass2TokenQueCount(void) const
    {
        // calculate number of tokens between current token instruction and next token with action
        if (mActiveTokenState->tokenQue.size() > mPass2TokenQuePosition)
            return mActiveTokenState->tokenQue.size() - 1 - mPass2TokenQuePosition;
        else
            return 0;
    }
    //-----------------------------------------------------------------------
    size_t Compiler2Pass::getRemainingTokensForAction(void) const
    {
        size_t remainingTokens = getPass2TokenQueCount();
        // don't count token for next action
        if (remainingTokens > 0)
            --remainingTokens;
        return remainingTokens;
    }

    //-----------------------------------------------------------------------
    void Compiler2Pass::setClientBNFGrammer(void)
    {
        // switch to internal BNF containers
        // clear client containers
        mClientTokenState = &mClientTokenStates[getClientGrammerName()];
        // attempt to compile the grammar into a rule base if no rules exist
        if (mClientTokenState->rootRulePath.size() == 0)
        {
            mClientTokenState->tokenQue.reserve(100);
            mClientTokenState->lexemeTokenDefinitions.reserve(100);
            // first entry in rule path is set as a bad entry and no token should reference it
            mClientTokenState->rootRulePath.resize(1);
            // allow the client to set up token definitions prior to
            // compiling the BNF grammar
            // ensure token definitions are added to the client state
            mActiveTokenState = mClientTokenState;
            // get client to set up token definitions and actions it wants to know about
            setupTokenDefinitions();
            // make sure active token state is for BNF compiling
            mActiveTokenState = &mBNFTokenState;
            mSource = &getClientBNFGrammer();

            if (doPass1())
            {
                buildClientBNFRulePaths();
            }
            else
            {
                OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR, "BNF Grammar compilation failed for " +
                    getClientGrammerName(), "Compiler2Pass::setClientBNFGrammer");
            }
            // change token state to client data after compiling grammar
            mActiveTokenState = mClientTokenState;
            // verify the client rule paths and associated terminal and non-terminal lexemes
            verifyTokenRuleLinks(getClientGrammerName());
        }
    }

    //-----------------------------------------------------------------------
    bool Compiler2Pass::processRulePath(size_t rulepathIDX)
    {
        // rule path determines what tokens and therefore what lexemes are acceptable from the source
        // it is assumed that the tokens with the longest similar lexemes are arranged first so
        // if a match is found it is accepted and no further searching is done

        if (rulepathIDX >= mActiveTokenState->rootRulePath.size())
        {
            // this is very bad and there is no way to recover so raise exception
            OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR, "rule ID exceeds rule base bounds.", "Compiler2Pass::processRulePath");
        }
        // record position of last token in container
        // to be used as the rollback position if a valid token is not found
        const size_t TokenContainerOldSize = mActiveTokenState->tokenQue.size();
        const size_t OldCharPos = mCharPos;
        const size_t OldLinePos = mCurrentLine;
        const bool OldLabelIsActive = mLabelIsActive;
        const size_t OldActiveLabelKey = mActiveLabelKey;
        const String OldLabel = mLabels[OldActiveLabelKey];

        // keep track of what non-terminal token activated the rule
        size_t ActiveNTTRule = mActiveTokenState->rootRulePath[rulepathIDX].tokenID;
        // start rule path at next position for definition
        ++rulepathIDX;

        // assume the rule will pass
        bool passed = true;
        bool tokenFound = false;
        bool endFound = false;
        bool parseErrorLogged = false;

        // keep following rulepath until the end is reached
        while (!endFound)
        {
            switch (mActiveTokenState->rootRulePath[rulepathIDX].operation)
            {

            case otAND:
                // only validate if the previous rule passed
                if (passed)
                    passed = ValidateToken(rulepathIDX, ActiveNTTRule);
                // log error message if a previous token was found in this rule path and the current token failed
                if (tokenFound && !parseErrorLogged && !passed)
                {
                    parseErrorLogged = true;
                    LogManager::getSingleton().logMessage(
                        "*** ERROR in : " + getClientGrammerName() +
                        "\nSource: " + mSourceName +
                        "\nUnknown token found, was expecting: " + getBNFGrammerTextFromRulePath(rulepathIDX)
                        );
                    LogManager::getSingleton().logMessage(
                        " Found: >>>" + mSource->substr(mCharPos, 20) +
                        "<<<, while in rule path: <" + mActiveTokenState->lexemeTokenDefinitions[ActiveNTTRule].lexeme
                        + ">"
                        );
                }

                break;

            case otOR:
                // only validate if the previous rule failed
                if (passed == false)
                {
                    // clear previous tokens from entry and try again
                    mActiveTokenState->tokenQue.resize(TokenContainerOldSize);
                    passed = ValidateToken(rulepathIDX, ActiveNTTRule);
                }
                else
                {
                    // path passed up to this point therefore finished so pretend end marker found
                    endFound = true;
                }
                break;

            case otOPTIONAL:
                // if previous passed then try this rule but it does not affect the success of the rule since it's optional
                if (passed) ValidateToken(rulepathIDX, ActiveNTTRule);
                break;

            case otREPEAT:
                // repeat until called rule fails or cursor does not advance
                // repeat is 0 or more times
                if (passed)
                {
                    // keep calling until failure or no change in cursor position
                    size_t prevPos = mCharPos;
                    while (ValidateToken(rulepathIDX, ActiveNTTRule))
                    {
                        if (mCharPos > prevPos)
                        {
                            prevPos = mCharPos;
                        }
                        else
                        {
                            // repeat failed to advance the cursor position so time to quit since the repeating rule
                            // path isn't finding anything
                            // this can happen if the rule being called only has _optional_ rules
                            // this checking of the cursor positions prevents an infinite loop from occurring
                            break;
                        }
                    }
                }
                break;

            case otDATA:
                // skip it, should have been handled by previous operation.
                break;

            case otNOT_TEST:
                // only validate if the previous rule passed
                if (passed)
                {

                    // perform look ahead and test if rule production fails
                    const size_t la_TokenContainerOldSize = mActiveTokenState->tokenQue.size();
                    const size_t la_OldCharPos = mCharPos;
                    const size_t la_OldLinePos = mCurrentLine;
                    const bool la_OldLabelIsActive = mLabelIsActive;
                    const size_t la_OldActiveLabelKey = mActiveLabelKey;
                    const String la_OldLabel = mLabels[la_OldActiveLabelKey];

                    passed = !ValidateToken(rulepathIDX, ActiveNTTRule);

                    // only wanted to take a peek as to what was ahead so now restore back to current position
                    mActiveTokenState->tokenQue.resize(la_TokenContainerOldSize);
                    mCharPos = la_OldCharPos;
                    mCurrentLine = la_OldLinePos;
                    // restore label state if it was active before the not test
                    if (la_OldLabelIsActive)
                    {
                        mActiveLabelKey = la_OldActiveLabelKey;
                        mLabels[la_OldActiveLabelKey] = la_OldLabel;
                        mLabelIsActive = la_OldLabelIsActive;
                    }
                    // only perform full rollback if tokens found
                    if (!passed)
                    {
                        // the rule did not validate so get rid of tokens decoded
                        // roll back the token container end position to what it was when the rule started
                        // this will get rid of all tokens that had been pushed on the container while
                        // trying to validate this rule
                        mActiveTokenState->tokenQue.resize(TokenContainerOldSize);
                        //mConstants.resize(OldConstantsSize);
                        mCharPos = OldCharPos;
                        mCurrentLine = OldLinePos;
                        // restore label state if it was active before the not test
                        if (OldLabelIsActive)
                        {
                            mActiveLabelKey = OldActiveLabelKey;
                            mLabels[OldActiveLabelKey] = OldLabel;
                            mLabelIsActive = OldLabelIsActive;
                        }

                        // terminate rule production processing
                        endFound = true;
                    }
                }
                break;

            case otEND:
                // end of rule found so time to return
                endFound = true;
                // only rollback if no tokens found
                if (!passed && !tokenFound)
                {
                    // the rule did not validate so get rid of tokens decoded
                    // roll back the token container end position to what it was when the rule started
                    // this will get rid of all tokens that had been pushed on the container while
                    // trying to validate this rule
                    mActiveTokenState->tokenQue.resize(TokenContainerOldSize);
                    //mConstants.resize(OldConstantsSize);
                    mCharPos = OldCharPos;
                    mCurrentLine = OldLinePos;
                }
                else
                {
                    // if the rule path was partially completed, one or more tokens found, then put a
                    // warning in the log
                    if (!passed && tokenFound && !mLabelIsActive)
                    {
                        passed = true;
                        // log last valid token found
                        const TokenInst& tokenInst = mActiveTokenState->tokenQue[mActiveTokenState->tokenQue.size() - 1];
                        LogManager::getSingleton().logMessage(
                            "Last valid token found was at line: " + StringConverter::toString(tokenInst.line));
                        LogManager::getSingleton().logMessage(
                            "source hint: >>>" + mSource->substr(tokenInst.pos, 20) + "<<<");
                    }
                }
                break;

            default:
                // an exception should be raised since the code should never get here
                passed = false;
                endFound = true;
                break;

            } // end switch
            // prevent rollback from occurring if a token was found but a later part of the rule fails
            // this allows pass 2 to either fix the problem or report the error and continue on.
            // Don't do this for _no_token_ since it's a special system token and has nothing to do with
            // a successful parse of the source. Can check this by looking at mNoTerminalToken state.
            // if _no_token_ had just been validated then mNoTerminalToken will be true.
            if (passed && !mNoTerminalToken)
                tokenFound = true;
            // move on to the next rule in the path
            ++rulepathIDX;
        } // end while

        return passed;
    }

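    // Worked example of the interpreter above: evaluating the bootstrap rule
    // "<rule> ::= <identifier> '::=' <expression>" walks the flat TokenRule
    // sequence (otAND, BNF_IDENTIFIER)(otAND, BNF_SET_RULE)(otAND, BNF_EXPRESSION)
    // (otEND, 0): each otAND entry calls ValidateToken, which either matches a
    // terminal lexeme in the source or recurses into processRulePath for a
    // non-terminal, and otEND decides whether to keep or roll back the tokens
    // collected for this rule.
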
    //-----------------------------------------------------------------------
    bool Compiler2Pass::isCharacterLabel(const size_t rulepathIDX)
    {
        // assume the test is going to fail
        bool Passed = false;

        // get token from next rule operation
        // the token string is a list of valid single characters
        // compare character at current cursor position in script to characters in list for a match
        // if match found then add character to active label
        // _character_ will not have a token definition but the next rule operation should be
        // DATA and have the token ID required to get the character set.
        const TokenRule& rule = mActiveTokenState->rootRulePath[rulepathIDX + 1];
        if (rule.operation == otDATA)
        {
            const size_t TokenID = rule.tokenID;
            if (mActiveTokenState->lexemeTokenDefinitions[TokenID].lexeme.find((*mSource)[mCharPos]) != String::npos)
            {
                // is a new label starting?
                // if mLabelIsActive is false then starting a new label so need a new mActiveLabelKey
                if (!mLabelIsActive)
                {
                    // mActiveLabelKey will be the end of the instruction container ie the size of mTokenInstructions
                    mActiveLabelKey = mActiveTokenState->tokenQue.size();
                    mLabelIsActive = true;
                    mNoSpaceSkip = true;
                    // reset the contents of the label since it might have been used prior to a rollback
                    mLabels[mActiveLabelKey] = "";
                }
                // add the single character to the end of the active label
                mLabels[mActiveLabelKey] += (*mSource)[mCharPos];
                Passed = true;
            }
        }

        return Passed;
    }
    //-----------------------------------------------------------------------
    bool Compiler2Pass::ValidateToken(const size_t rulepathIDX, const size_t activeRuleID)
    {
        size_t tokenlength = 0;
        // assume the test is going to fail
        bool Passed = false;
        size_t tokenID = mActiveTokenState->rootRulePath[rulepathIDX].tokenID;
        // if terminal token then compare text of lexeme with what is in source
        if ((tokenID >= SystemTokenBase) ||
            !mActiveTokenState->lexemeTokenDefinitions[tokenID].isNonTerminal)
        {
            if (tokenID != _character_)
            {
                mLabelIsActive = false;
                // allow spaces to be skipped for next lexeme processing
                mNoSpaceSkip = false;
            }

            if (tokenID == _no_space_skip_)
            {
                // don't skip spaces to get to next lexeme
                mNoSpaceSkip = true;
                // move on to next rule
                Passed = true;
            }
            else if (tokenID == _no_token_)
            {
                // turn on no terminal token processing for next rule
                mNoTerminalToken = true;
                // move on to next rule
                Passed = true;
            }
            // if label processing is active ie previous token was _character_
            // and current token is supposed to be a _character_ then don't
            // position to next lexeme in source
            else if (mNoSpaceSkip || positionToNextLexeme())
            {
                // if token is supposed to be a number then check if it's a numerical constant
                if (tokenID == _value_)
                {
                    float constantvalue = 0.0f;
                    if ((Passed = isFloatValue(constantvalue, tokenlength)))
                    {
                        // key is the next instruction index
                        mConstants[mActiveTokenState->tokenQue.size()] = constantvalue;
                    }
                }
                else // check if user label or valid keyword token
                {
                    if (tokenID == _character_)
                    {
                        if ((Passed = isCharacterLabel(rulepathIDX)))
                            // only one character was processed
                            tokenlength = 1;
                    }
                    else
                    {

                        // compare token lexeme text with source text
                        if ((Passed = isLexemeMatch(mActiveTokenState->lexemeTokenDefinitions[tokenID].lexeme, mActiveTokenState->lexemeTokenDefinitions[tokenID].isCaseSensitive)))
                        {
                            tokenlength = mActiveTokenState->lexemeTokenDefinitions[tokenID].lexeme.length();
                            // check if terminal token should be ignored ie not put in instruction que
                            if (mNoTerminalToken)
                                tokenID = _no_token_;
                        }
                        // always clear no terminal token flag. it only works for one pending terminal token.
                        mNoTerminalToken = false;
                    }
                }

                // only generate one token instruction per label:
                // turn off generation of a new token instruction if this is not
                // the first _character_ in a sequence of _character_ terminal tokens.
                // Only want one _character_ token which identifies a label
                if (tokenID == _character_)
                {
                    if (mActiveTokenState->tokenQue.size() > mActiveLabelKey)
                    {
                        // this token is not the first _character_ in the label sequence
                        // so turn off the token by turning tokenID into _no_token_
                        tokenID = _no_token_;
                    }
                }

                // if valid terminal token was found then add it to the instruction container for pass 2 processing
                if (Passed)
                {
                    if (tokenID != _no_token_)
                    {
                        TokenInst newtoken;
                        // push token onto end of container
                        newtoken.tokenID = tokenID;
                        newtoken.NTTRuleID = activeRuleID;
                        newtoken.line = mCurrentLine;
                        newtoken.pos = mCharPos;
                        newtoken.found = true;

                        mActiveTokenState->tokenQue.push_back(newtoken);
                        // token action processing
                        // if the token has an action then fire previous token action
                        checkTokenActionTrigger();
                    }

                    // update source position
                    mCharPos += tokenlength;
                } // end if
            } // end else if

        }
        // else a non-terminal token was found
        else
        {
            // execute rule for non-terminal
            // get rule ID for index into rulepath to be called
            Passed = processRulePath(mActiveTokenState->lexemeTokenDefinitions[tokenID].ruleID);
        }

        return Passed;
    }

    //-----------------------------------------------------------------------
    bool Compiler2Pass::isFloatValue(float& fvalue, size_t& charsize) const
    {
        // check to see if it is a numeric float value
        bool valuefound = false;

        const char* startptr = mSource->c_str() + mCharPos;
        char* endptr = NULL;

        fvalue = (float)strtod(startptr, &endptr);
        // if a valid float was found then endptr will have the pointer to the first invalid character
        if (endptr)
        {
            if (endptr > startptr)
            {
                // a valid value was found so process it
                charsize = endptr - startptr;
                valuefound = true;
            }
        }

        return valuefound;
    }

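    // Note: because the scan above relies on strtod, all standard C float
    // forms are accepted, e.g. "42", "-1.5", ".25" or "3e-2"; charsize is the
    // number of source characters consumed so the scanner can advance past
    // the literal.
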
    //-----------------------------------------------------------------------
    bool Compiler2Pass::isLexemeMatch(const String& lexeme, const bool caseSensitive) const
    {
        // compare text at source + charpos with the lexeme: limit testing to lexeme size
        if (!caseSensitive)
        {
            String testItem = mSource->substr(mCharPos, lexeme.length());
            StringUtil::toLowerCase(testItem);
            return (testItem.compare(lexeme) == 0);
        }
        else
        {
            return (mSource->compare(mCharPos, lexeme.length(), lexeme) == 0);
        }
    }

    //-----------------------------------------------------------------------
    bool Compiler2Pass::positionToNextLexeme()
    {
        bool validlexemefound = false;
        bool endofsource = mCharPos >= mEndOfSource;

        while (!validlexemefound && !endofsource)
        {
            skipWhiteSpace();
            skipEOL();
            skipComments();
            // have we reached the end of the string?
            if (mCharPos >= mEndOfSource)
                endofsource = true;
            else
            {
                // if ASCII > space then assume a valid character is found
                if ((*mSource)[mCharPos] > ' ') validlexemefound = true;
            }
        } // end of while

        return validlexemefound;
    }

    //-----------------------------------------------------------------------
    void Compiler2Pass::skipComments()
    {
        if (mCharPos >= mEndOfSource)
            return;
        // if current char and next are // then search for EOL
        if (mSource->compare(mCharPos, 2, "//") == 0)
            findEOL();
    }

    //-----------------------------------------------------------------------
    void Compiler2Pass::findEOL()
    {
        if (mCharPos >= mEndOfSource)
            return;
        // find the EOL character and move to this position
        mCharPos = mSource->find('\n', mCharPos);
    }

    //-----------------------------------------------------------------------
    void Compiler2Pass::skipEOL()
    {
        if (mCharPos >= mEndOfSource)
            return;

        if (((*mSource)[mCharPos] == '\n') || ((*mSource)[mCharPos] == '\r'))
        {
            mCurrentLine++;
            mCharPos++;
            if (mCharPos >= mEndOfSource)
                return;
            // consume the second character of a two-character line ending
            if (((*mSource)[mCharPos] == '\n') || ((*mSource)[mCharPos] == '\r'))
            {
                mCharPos++;
            }
        }
    }

    //-----------------------------------------------------------------------
    void Compiler2Pass::skipWhiteSpace()
    {
        if (mCharPos >= mEndOfSource)
            return;

        mCharPos = mSource->find_first_not_of(" \t", mCharPos);
    }

    //-----------------------------------------------------------------------
    void Compiler2Pass::addLexemeToken(const String& lexeme, const size_t token, const bool hasAction, const bool caseSensitive)
    {
        if (token >= mActiveTokenState->lexemeTokenDefinitions.size())
            mActiveTokenState->lexemeTokenDefinitions.resize(token + 1);
        // since resizing guarantees the token definition will exist, just assign values to members
        LexemeTokenDef& tokenDef = mActiveTokenState->lexemeTokenDefinitions[token];
        if (tokenDef.ID != 0)
        {
            OGRE_EXCEPT(Exception::ERR_DUPLICATE_ITEM, "In " + getClientGrammerName() +
                ", lexeme >>>" +
                lexeme + "<<< already exists in lexeme token definitions",
                "Compiler2Pass::addLexemeToken");
        }
        tokenDef.ID = token;
        tokenDef.lexeme = lexeme;
        if (!caseSensitive)
            StringUtil::toLowerCase(tokenDef.lexeme);
        tokenDef.hasAction = hasAction;
        tokenDef.isCaseSensitive = caseSensitive;

        mActiveTokenState->lexemeTokenMap[lexeme] = token;
    }

    //-----------------------------------------------------------------------
    void Compiler2Pass::checkTokenActionTrigger(void)
    {
        size_t lastTokenQuePos = mActiveTokenState->tokenQue.size();
        // if there are no token instructions in the que then there is nothing to do
        if (lastTokenQuePos == 0)
            return;

        --lastTokenQuePos;
        // if the last token position and the previous action position are the same then do nothing
        if (lastTokenQuePos == mPreviousActionQuePosition)
            return;

        const size_t lastTokenID = mActiveTokenState->tokenQue.at(lastTokenQuePos).tokenID;
        // don't check actions for system token IDs since they are not in lexemeTokenDefinitions
        if (lastTokenID >= SystemTokenBase)
            return;

        // check action trigger if last token has an action
        if (mActiveTokenState->lexemeTokenDefinitions.at(lastTokenID).hasAction)
        {
            // only activate the action belonging to the token found previously
            activatePreviousTokenAction();
            // current token action now becomes the previous one
            mPreviousActionQuePosition = lastTokenQuePos;
        }
    }

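    // Action timing example: with a token stream A B C D where A and D carry
    // actions, pushing D during pass 1 makes checkTokenActionTrigger fire A's
    // action first (with mPass2TokenQuePosition rewound to A's position so the
    // action can consume B and C via the getNextToken* accessors); D then
    // becomes the pending "previous" action, fired either by the next action
    // token or by the end-of-source call in doPass1.
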
    //-----------------------------------------------------------------------
    String Compiler2Pass::getBNFGrammerTextFromRulePath(size_t ruleID)
    {

        String grammerText;

        // default to using client rule path
        // check if index is in bounds
        if (ruleID >= mActiveTokenState->rootRulePath.size())
        {
            OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR, "rule ID exceeds client rule path bounds.", "Compiler2Pass::getBNFGrammerTextFromRulePath");
        }
        // iterate through rule path and get terminal and non-terminal strings
        const TokenRuleContainer& rulePath = mActiveTokenState->rootRulePath;

        while (rulePath[ruleID].operation != otEND)
        {
            // rule text processing - the op instructions, system tokens
            switch (rulePath[ruleID].operation)
            {
            // rule lexeme ::=
            case otRULE:
                grammerText += "\n" + getLexemeText(ruleID) + " ::=";
                break;
            // no special processing for AND op
            case otAND:
                grammerText += " " + getLexemeText(ruleID);
                break;
            // or | lexeme
            case otOR:
                grammerText += " | " + getLexemeText(ruleID);
                break;
            // optional [lexeme]
            case otOPTIONAL:
                grammerText += " [" + getLexemeText(ruleID) + "]";
                break;
            // repeat {lexeme}
            case otREPEAT:
                grammerText += " {" + getLexemeText(ruleID) + "}";
                break;
            // not test (?!lexeme)
            case otNOT_TEST:
                grammerText += " (?!" + getLexemeText(ruleID) + ")";
                break;
            }
            // lexeme/token text processing
            ++ruleID;
        }

        return grammerText;
    }

| 1201 | //-----------------------------------------------------------------------
|
---|
| 1202 |
|
---|
| 1203 | //-----------------------------------------------------------------------
|
---|
| 1204 | // Private Methods
|
---|
| 1205 | //-----------------------------------------------------------------------
|
---|
| 1206 | //-----------------------------------------------------------------------
|
---|
String Compiler2Pass::getLexemeText(size_t& ruleID)
{
    if (ruleID >= mActiveTokenState->rootRulePath.size())
    {
        OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR,
            "rule ID exceeds client rule path bounds.", "Compiler2Pass::getLexemeText"
        );
    }

    String lexeme;

    const TokenRuleContainer& rulePath = mActiveTokenState->rootRulePath;
    const size_t tokenID = rulePath[ruleID].tokenID;

    if (tokenID < SystemTokenBase)
    {
        // non-terminal tokens
        if (mActiveTokenState->lexemeTokenDefinitions[tokenID].isNonTerminal)
        {
            lexeme = "<" + mActiveTokenState->lexemeTokenDefinitions[tokenID].lexeme + ">";
        }
        else // terminal tokens
        {
            lexeme = "'" + mActiveTokenState->lexemeTokenDefinitions[tokenID].lexeme + "'";
        }
    }
    else // system token processing
    {
        switch (rulePath[ruleID].tokenID)
        {
        case _character_:
            // need to get next rule instruction for data
            ++ruleID;
            // data for _character_ is always a set so put () around text string
            lexeme = "(" + mActiveTokenState->lexemeTokenDefinitions[rulePath[ruleID].tokenID].lexeme + ")";
            break;
        case _value_:
            // <#> - need name of label?
            lexeme = "<#>";
            break;
        }
    }

    return lexeme;
}
//-----------------------------------------------------------------------
void Compiler2Pass::activatePreviousTokenAction(void)
{
    const size_t previousTokenID = mActiveTokenState->tokenQue.at(mPreviousActionQuePosition).tokenID;
    const LexemeTokenDef& tokenDef = mActiveTokenState->lexemeTokenDefinitions.at(previousTokenID);
    if (tokenDef.hasAction)
    {
        // set the current pass 2 token que position to previous action que position
        // assume that pass 2 processing will use tokens downstream
        mPass2TokenQuePosition = mPreviousActionQuePosition;
        executeTokenAction(previousTokenID);
    }
}
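// Editorial note on the intent, as read from the code above: token actions
// fire one token "late" - when a new action token is queued, the action
// belonging to the token at mPreviousActionQuePosition is executed first,
// with mPass2TokenQuePosition rewound to that position so the action can
// consume the tokens that were queued after it.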
//-----------------------------------------------------------------------
void Compiler2Pass::buildClientBNFRulePaths(void)
{
    bool isFirstToken = true;
    OperationType pendingRuleOp = otAND;

    // convert tokens in BNF token que to rule paths
    while (getPass2TokenQueCount() > 0)
    {
        // get a pass 2 token
        // if this is the first time getting a token then get the current token
        const TokenInst& currentToken = isFirstToken ? getCurrentToken() : getNextToken();
        isFirstToken = false;
        // only process the token if it's valid
        if (currentToken.found)
        {
            // a valid token has been found, convert to a rule
            switch (currentToken.tokenID)
            {
            case BNF_ID_BEGIN: // <
                extractNonTerminal(pendingRuleOp);
                pendingRuleOp = otAND;
                break;

            case BNF_CONSTANT_BEGIN: // <#
                extractNumericConstant(pendingRuleOp);
                pendingRuleOp = otAND;
                break;

            case BNF_OR: // |
                pendingRuleOp = otOR;
                break;

            case BNF_REPEAT_BEGIN: // {
                pendingRuleOp = otREPEAT;
                break;

            case BNF_NO_TOKEN_START: // -'
                extractTerminal(pendingRuleOp, true);
                pendingRuleOp = otAND;
                break;

            case BNF_SINGLEQUOTE: // '
                extractTerminal(pendingRuleOp);
                pendingRuleOp = otAND;
                break;

            case BNF_OPTIONAL_BEGIN: // [
                pendingRuleOp = otOPTIONAL;
                break;

            case BNF_NOT_TEST_BEGIN: // (?!
                pendingRuleOp = otNOT_TEST;
                break;

            case BNF_SET_BEGIN: // (
                extractSet(pendingRuleOp);
                pendingRuleOp = otAND;
                break;

            default:
                // trap closing tokens, i.e. ] } )
                break;
            } // end switch
        } // end if
    } // end while
}

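// Editorial sketch of the conversion, based on the cases above: each BNF
// operator token only records a pending operation; the next terminal or
// non-terminal extracted is stored with that operation, after which the
// pending op reverts to otAND. For a hypothetical client rule
//
//     <thing> ::= 'ID' <name> [<option>]
//
// the resulting rule path would look roughly like:
//
//     otRULE(<thing>), otAND('ID'), otAND(<name>), otOPTIONAL(<option>), otEND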
//-----------------------------------------------------------------------
void Compiler2Pass::modifyLastRule(const OperationType pendingRuleOp, const size_t tokenID)
{
    // add operation using this token ID to the current rule expression
    size_t lastIndex = mClientTokenState->rootRulePath.size();
    if (lastIndex == 0)
    {
        // throw exception since there should have been at least one rule existing
        OGRE_EXCEPT(Exception::ERR_INTERNAL_ERROR, "BNF Grammar build rules failed: no previous rule op defined", "Compiler2Pass::modifyLastRule");
    }
    --lastIndex;
    mClientTokenState->rootRulePath[lastIndex].operation = pendingRuleOp;
    mClientTokenState->rootRulePath[lastIndex].tokenID = tokenID;
    // add new end op token rule
    mClientTokenState->rootRulePath.push_back(TokenRule(otEND, 0));
}

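// Editorial note: modifyLastRule relies on the rule path always ending with
// an otEND marker - it overwrites that marker with the new operation and
// token ID, then appends a fresh otEND, so the path stays terminated. For
// example, adding otAND(tok) to
//
//     [ otRULE(r), otAND(a), otEND ]
//
// leaves
//
//     [ otRULE(r), otAND(a), otAND(tok), otEND ]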
//-----------------------------------------------------------------------
size_t Compiler2Pass::getClientLexemeTokenID(const String& lexeme, const bool isCaseSensitive)
{
    size_t tokenID = mClientTokenState->lexemeTokenMap[lexeme];

    if (tokenID == 0)
    {
        // lexeme not found so a new entry is made by the system
        // note that all lexemes added by the system will not/can not have an action
        tokenID = mClientTokenState->lexemeTokenDefinitions.size();
        // add identifier to client lexeme tokens
        mActiveTokenState = mClientTokenState;
        addLexemeToken(lexeme, tokenID, false, isCaseSensitive);
        mActiveTokenState = &mBNFTokenState;
    }

    return tokenID;
}
//-----------------------------------------------------------------------
void Compiler2Pass::extractNonTerminal(const OperationType pendingRuleOp)
{
    // beginning of identifier
    // next token should be for a label
    const String& identifierLabel = getNextTokenLabel();
    // next token should be id end
    getNextToken(BNF_ID_END);
    // add identifier to lexeme token definitions but keep case sensitivity
    const size_t tokenID = getClientLexemeTokenID(identifierLabel, true);
    LexemeTokenDef& tokenDef = mClientTokenState->lexemeTokenDefinitions[tokenID];

    // peek at the next token instruction to see if this
    // identifier is for a new rule or is part of the current rule
    if (testNextTokenID(BNF_SET_RULE))
    {
        // consume set rule
        getNextToken(BNF_SET_RULE);
        // check to make sure this is the first time this rule is being set up by
        // verifying rule id is 0
        if (tokenDef.ruleID != 0)
        {
            // this is not the first time for this identifier to be set up as a rule
            // since duplicate rules cannot exist, throw an exception
            OGRE_EXCEPT(Exception::ERR_DUPLICATE_ITEM, "while parsing BNF grammar for: " +
                getClientGrammerName() +
                ", an attempt was made to assign a rule to identifier: " +
                tokenDef.lexeme + ", that already had a rule assigned",
                "Compiler2Pass::extractNonTerminal");
        }
        // add new rule to end of rule path
        mClientTokenState->rootRulePath.push_back(TokenRule(otRULE, tokenID));
        tokenDef.ruleID = mClientTokenState->rootRulePath.size() - 1;
        // add new end op token rule
        mClientTokenState->rootRulePath.push_back(TokenRule(otEND, 0));
    }
    else // just a reference to a non-terminal
    {
        modifyLastRule(pendingRuleOp, tokenID);
    }

    tokenDef.isNonTerminal = true;
}
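// Editorial example, based on the logic above: in a grammar fragment such as
//
//     <decl> ::= <name> <name>
//
// the leading <decl> is followed by ::= and therefore opens a new rule
// (otRULE plus terminating otEND), while each <name> on the right-hand side
// is only a reference folded into the current rule via modifyLastRule; its
// own rule body may be defined later in the grammar text.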
//-----------------------------------------------------------------------
void Compiler2Pass::extractTerminal(const OperationType pendingRuleOp, const bool notoken)
{
    // beginning of label
    // next token should be for a label
    const String& terminalLabel = getNextTokenLabel();
    // next token should be single quote end
    getNextToken(BNF_SINGLEQUOTE);
    // add terminal to lexeme token definitions
    // note that if label not in the map it is automatically added
    const size_t tokenID = getClientLexemeTokenID(terminalLabel);
    if (notoken)
        modifyLastRule(otAND, _no_token_);
    modifyLastRule(pendingRuleOp, tokenID);
}
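// Editorial note, hedged: for a quoted terminal such as 'vertex_program' the
// lexeme is registered (case-insensitive by default) and appended to the
// current rule with the pending op. When notoken is true, an
// otAND(_no_token_) entry is inserted first, which presumably marks the
// terminal as one to match without placing a token for it in the pass 2
// queue.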
//-----------------------------------------------------------------------
void Compiler2Pass::extractSet(const OperationType pendingRuleOp)
{
    const String& setLabel = getNextTokenLabel();
    // next token should be )
    getNextToken(BNF_SET_END);
    // add set to lexeme token definitions but keep case sensitivity
    const size_t tokenID = getClientLexemeTokenID(setLabel, true);
    // add operation using this token ID to the current rule expression
    modifyLastRule(pendingRuleOp, _character_);
    // add the data required by the character lookup operation
    modifyLastRule(otDATA, tokenID);
}
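// Editorial example: a character set in the grammar such as
//
//     (0123456789)
//
// is stored as two rule entries: the pending operation carrying the system
// token _character_, followed by an otDATA entry carrying the token ID of
// the set's lexeme, which the character lookup uses at match time.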
//-----------------------------------------------------------------------
void Compiler2Pass::extractNumericConstant(const OperationType pendingRuleOp)
{
    // consume label for constant, don't need it for anything
    getNextTokenLabel();

    getNextToken(BNF_ID_END); // >
    // add the value operation to the current rule expression
    modifyLastRule(pendingRuleOp, _value_);
}


} // namespace Ogre