From 247904a84430b8c9151fa6afb68f01b60afb92c9 Mon Sep 17 00:00:00 2001 From: Adrian Thurston Date: Sun, 1 Jul 2012 12:48:22 -0400 Subject: moved 'colm' dir to 'src' --- src/lmparse.kh | 120 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 120 insertions(+) create mode 100644 src/lmparse.kh (limited to 'src/lmparse.kh') diff --git a/src/lmparse.kh b/src/lmparse.kh new file mode 100644 index 00000000..86b70b6f --- /dev/null +++ b/src/lmparse.kh @@ -0,0 +1,120 @@ +/* + * Copyright 2001-2007 Adrian Thurston + */ + +/* This file is part of Colm. + * + * Colm is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * Colm is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with Colm; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ + +#ifndef RLPARSE_H +#define RLPARSE_H + +#include +#include "avltree.h" +#include "parsedata.h" + +#define PROPERTY_REDUCE_FIRST 0x1 + +struct ColmParser +{ + ColmParser( Compiler *pd, const char *fileName, const char *sectionName, const InputLoc §ionLoc ) + : pd(pd), sectionName(sectionName), enterRl(false) + {} + + %%{ + parser ColmParser; + + # Use a class for tokens. + token uses class Token; + + # Atoms. + token TK_Word, TK_Literal, TK_SingleLit, TK_DoubleLit, TK_Number, TK_UInt, + TK_Hex, KW_Nil, KW_True, KW_False; + + # General tokens. + token TK_DotDot, TK_ColonGt, TK_ColonGtGt, TK_LtColon, + TK_DoubleArrow, TK_StarStar, TK_NameSep, TK_DashDash, TK_DoubleEql, + TK_NotEql, TK_DoubleColon, TK_LessEql, TK_GrtrEql, TK_RightArrow, + TK_LitPat, TK_AmpAmp, TK_BarBar, TK_SqOpen, TK_SqOpenNeg, TK_SqClose, + TK_Dash, TK_ReChar, TK_LtLt; + + # Defining things. + token KW_Rl, KW_Def, KW_Lex, KW_Context, KW_Ignore, KW_Token, KW_Commit, KW_Namespace, + KW_Literal, KW_ReduceFirst, KW_Map, KW_List, KW_Vector, KW_Accum, KW_Global, KW_Export, + KW_Iter, KW_Reject, KW_Ptr, KW_Ref, KW_Deref; + + # Language. + token KW_If, KW_While, KW_Else, KW_Elsif, KW_For, KW_Return, KW_Yield, KW_In, + KW_Break, KW_PrintXMLAC, KW_PrintXML, KW_Print, KW_PrintStream, KW_Require; + + # Patterns. + token KW_Match, KW_Construct, KW_Parse, KW_ParseStop, KW_New, KW_MakeToken, + KW_MakeTree, KW_TypeId, KW_Alias, KW_Send, KW_Ni, KW_Ci; + + token KW_Include, KW_Preeof; + + token KW_Left, KW_Right, KW_Nonassoc, KW_Prec; + + }%% + + %% write instance_data; + + + void init(); + int parseLangEl( int type, const Token *token ); + + int token( InputLoc &loc, int tokId, char *tokstart, int toklen ); + void addRegularDef( const InputLoc &loc, Namespace *nspace, + const String &name, Join *join ); + TokenRegion *createRegion( String &name ); + void addRegionDef( const InputLoc &loc, Namespace *nspace, + const String &name, TokenRegion *join ); + void addProduction( const InputLoc &loc, const String &name, + ProdElList *prodElList, bool commit, CodeBlock *redBlock, LangEl *predOf ); + void addArgvList(); + + /* Report an error encountered by the parser. */ + ostream &parse_error( int tokId, Token &token ); + + Compiler *pd; + + /* The name of the root section, this does not change during an include. */ + const char *sectionName; + + NameRef nameRef; + NameRefList nameRefList; + + LangElVect langElVect; + + PatternItemList *patternItemList; + ReplItemList *replItemList; + RegionVect regionStack; + NamespaceVect namespaceStack; + ContextVect contextStack; + + String curDefineId; + LelDefList *curDefList; + ProdElList *curProdElList; + + PredType predType; + ReCaptureVect reCaptureVect; + + bool enterRl; +}; + +%% write token_defs; + +#endif -- cgit v1.2.1