Add a basic AST generator based on https://github.com/rochus-keller/EbnfStudio
SSW-CocoR · mingodad · May 28, 2021 · Jun 1, 2021 · Jun 3, 2021 · Jun 3, 2021
commit 4f22deafabf11a8d25184a273af470f643552426
diff --git a/src/Coco.atg b/src/Coco.atg
@@ -35,6 +35,7 @@ $namespace=Coco
 #include "Tab.h"
 #include "DFA.h"
 #include "ParserGen.h"
+#define COCO_FRAME_PARSER
 
 COMPILER Coco
 
@@ -124,6 +125,13 @@ Coco                            (. Symbol *sym; Graph *g, *g1, *g2; wchar_t* gra
                                 .)
   { ANY }                       (. tab->semDeclPos = new Position(beg, la->pos, 0, line); .)
   [ "IGNORECASE"                (. dfa->ignoreCase = true; .) ]   /* pdt */
+  [ "TERMINALS" { ident 	(. sym = tab->FindSym(t->val);
+                                    if (sym != NULL) SemErr(L"name declared twice");
+                                    else {
+                                     sym = tab->NewSym(Node::t, t->val, t->line);
+                                     sym->tokenKind = Symbol::fixedToken;
+				}.)
+	} ] /*from cocoxml*/
   [ "CHARACTERS" { SetDecl }]
   [ "TOKENS"  { TokenDecl<Node::t> }]
   [ "PRAGMAS" { TokenDecl<Node::pr> }]

diff --git a/src/Parser.cpp b/src/Parser.cpp
diff --git a/src/Parser.frame b/src/Parser.frame
@@ -5,24 +5,24 @@ extended by M. Loeberbauer & A. Woess, Univ. of Linz
 ported to C++ by Csaba Balazs, University of Szeged
 with improvements by Pat Terry, Rhodes University
 
-This program is free software; you can redistribute it and/or modify it 
-under the terms of the GNU General Public License as published by the 
-Free Software Foundation; either version 2, or (at your option) any 
+This program is free software; you can redistribute it and/or modify it
+under the terms of the GNU General Public License as published by the
+Free Software Foundation; either version 2, or (at your option) any
 later version.
 
-This program is distributed in the hope that it will be useful, but 
-WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY 
-or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License 
+This program is distributed in the hope that it will be useful, but
+WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 for more details.
 
-You should have received a copy of the GNU General Public License along 
-with this program; if not, write to the Free Software Foundation, Inc., 
+You should have received a copy of the GNU General Public License along
+with this program; if not, write to the Free Software Foundation, Inc.,
 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
 
 As an exception, it is allowed to write an extension of Coco/R that is
 used as a plugin in non-free software.
 
-If not otherwise stated, any source code generated by Coco/R (other than 
+If not otherwise stated, any source code generated by Coco/R (other than
 Coco/R itself) does not fall under the GNU General Public License.
 -------------------------------------------------------------------------*/
 
@@ -41,6 +41,21 @@ Parser.h Specification
 
 -->namespace_open
 
+#ifdef PARSER_WITH_AST
+
+struct SynTree { // one syntax-tree node: a token plus a list of child nodes
+	SynTree(Token *t ): tok(t){} // stores t; ~SynTree() deletes it
+        ~SynTree(); // deletes tok and every entry of children
+
+	Token *tok; // token held by this node
+	ArrayList children; // entries are cast to SynTree* when dumped or destroyed
+
+	void dump(int indent=0, bool isLast=false); // prints this node and all descendants
+	void dump2(int maxT, int indent=0, bool isLast=false); // dump variant with a maxT cutoff; see its definition
+};
+
+#endif
+
 class Errors {
 public:
 	int count;			// number of errors detected
@@ -61,6 +76,11 @@ private:
 	int errDist;
 	int minErrDist;
 
+#ifdef PARSER_WITH_AST
+        void AstAddTerminal();
+        bool AstAddNonTerminal(eNonTerminals kind, const char *nt_name, int line);
+        void AstPopNonTerminal();
+#endif
 	void SynErr(int n);
 	void Get();
 	void Expect(int n);
@@ -105,6 +125,30 @@ Parser.cpp Specification
 
 -->namespace_open
 
+#ifdef PARSER_WITH_AST
+
+void Parser::AstAddTerminal() { // appends a node for the current token t to the node on top of ast_stack
+        SynTree *st_t = new SynTree( t->Clone() ); // cloned, so the node holds its own Token
+        ((SynTree*)ast_stack.Top())->children.Add(st_t); // NOTE(review): Top() is dereferenced unchecked -- assumes ast_stack is never empty here
+}
+
+bool Parser::AstAddNonTerminal(eNonTerminals kind, const char *nt_name, int line) { // opens a new non-terminal node
+        Token *ntTok = new Token(); // synthetic token describing the non-terminal
+        ntTok->kind = kind;
+        ntTok->line = line;
+        ntTok->val = coco_string_create(nt_name);
+        SynTree *st = new SynTree( ntTok );
+        ((SynTree*)ast_stack.Top())->children.Add(st); // attach under the node currently on top
+        ast_stack.Add(st); // added to ast_stack (presumably what Top() returns next) until AstPopNonTerminal()
+        return true; // always true as written
+}
+
+void Parser::AstPopNonTerminal() { // counterpart of AstAddNonTerminal()
+        ast_stack.Pop(); // presumably drops only the stack entry; the node was already added to its parent's children
+}
+
+#endif
+
 void Parser::SynErr(int n) {
 	if (errDist >= minErrDist) errors.SynErr(la->line, la->col, n);
 	errDist = 0;
@@ -176,7 +220,7 @@ struct ParserInitExistsRecognizer {
 	struct InitIsMissingType {
 		char dummy1;
 	};
-	
+
 	struct InitExistsType {
 		char dummy1; char dummy2;
 	};
@@ -200,7 +244,7 @@ struct ParserDestroyExistsRecognizer {
 	struct DestroyIsMissingType {
 		char dummy1;
 	};
-	
+
 	struct DestroyExistsType {
 		char dummy1; char dummy2;
 	};
@@ -280,8 +324,14 @@ bool Parser::StartOf(int s) {
 Parser::~Parser() {
 	ParserDestroyCaller<Parser>::CallDestroy(this);
 	delete dummyToken;
+#ifdef PARSER_WITH_AST
+        delete ast_root; // NOTE(review): ast_root is assigned by the generated start production; confirm the constructor nulls it, else this deletes garbage when no parse ran
+#endif
+	// noString/tokenString are released only when COCO_FRAME_PARSER is defined (Coco.atg and Parser.h define it)
+#ifdef COCO_FRAME_PARSER
         coco_string_delete(noString);
         coco_string_delete(tokenString);
+#endif
 }
 
 Errors::Errors() {
@@ -319,8 +369,60 @@ void Errors::Warning(const wchar_t *s) {
 }
 
 void Errors::Exception(const wchar_t* s) {
-	wprintf(L"%ls", s); 
+	wprintf(L"%ls", s);
 	exit(1);
 }
 
+#ifdef PARSER_WITH_AST
+
+static void printIndent(int n) { // writes n blanks through wprintf; no output when n <= 0
+    for(int left = n; left > 0; --left) wprintf(L" ");
+}
+
+SynTree::~SynTree() { // releases this node's token and every child subtree
+    //wprintf(L"Token %ls : %d : %d : %d : %d\n", tok->val, tok->kind, tok->line, tok->col, children.Count);
+    delete tok;
+    for(int i=0; i<children.Count; ++i) delete ((SynTree*)children[i]); // each delete runs this destructor on the child
+}
+
+// Prints this node and, recursively, its children (indent grows by 4 per level).
+// The marker is a wide literal printed with %ls; MSVC's wprintf reads a plain %s as wide.
+void SynTree::dump(int indent, bool isLast) {
+        int last_idx = children.Count;
+        printIndent(indent);
+        if(tok->col) {
+            wprintf(L"%ls\t%d\t%d\t%d\t%ls\n", ((isLast || (last_idx == 0)) ? L"= " : L" "), tok->line, tok->col, tok->kind, tok->val);
+        }
+        else {
+            wprintf(L"%d\t%d\t%d\t%ls\n", children.Count, tok->line, tok->kind, tok->val);
+        }
+        // isLast must flag the final child, i.e. index last_idx-1 (idx == last_idx can never hold).
+        for(int idx=0; idx < last_idx; ++idx) ((SynTree*)children[idx])->dump(indent+4, idx == last_idx - 1);
+}
+
+// Like dump(), except that a node whose token has col == 0 (presumably the synthetic
+// non-terminal tokens) and exactly one child is printed only if that child's kind < maxT.
+// NOTE(review): AstAddNonTerminal stores eNonTerminals values in tok->kind, which share
+// the numeric range of token kinds -- confirm the maxT test separates them as intended.
+void SynTree::dump2(int maxT, int indent, bool isLast) {
+        int last_idx = children.Count;
+        if(tok->col) {
+            printIndent(indent);
+            wprintf(L"%ls\t%d\t%d\t%d\t%ls\n", ((isLast || (last_idx == 0)) ? L"= " : L" "), tok->line, tok->col, tok->kind, tok->val); // wide marker + %ls: also correct under MSVC's wprintf
+        }
+        else {
+            bool show = true;
+            if(last_idx == 1) show = ((SynTree*)children[0])->tok->kind < maxT;
+            if(show) {
+                printIndent(indent);
+                wprintf(L"%d\t%d\t%d\t%ls\n", children.Count, tok->line, tok->kind, tok->val);
+            }
+        }
+        // isLast must flag the final child, i.e. index last_idx-1;
+        // the former test idx == last_idx could never hold inside this loop.
+        for(int idx=0; idx < last_idx; ++idx) ((SynTree*)children[idx])->dump2(maxT, indent+4, idx == last_idx - 1);
+}
+
+#endif
+
 -->namespace_close
diff --git a/src/Parser.h b/src/Parser.h
@@ -33,13 +33,29 @@ Coco/R itself) does not fall under the GNU General Public License.
 #include "Tab.h"
 #include "DFA.h"
 #include "ParserGen.h"
+#define COCO_FRAME_PARSER
 
 
 #include "Scanner.h"
 
 namespace Coco {
 
 
+#ifdef PARSER_WITH_AST
+
+struct SynTree { // one syntax-tree node: a token plus a list of child nodes
+	SynTree(Token *t ): tok(t){} // stores t as this node's token
+        ~SynTree(); // defined out of line in the parser source
+
+	Token *tok; // token held by this node
+	ArrayList children; // child nodes, held as untyped ArrayList entries
+
+	void dump(int indent=0, bool isLast=false); // prints this node and its descendants
+	void dump2(int maxT, int indent=0, bool isLast=false); // dump variant taking a maxT cutoff
+};
+
+#endif
+
 class Errors {
 public:
 	int count;			// number of errors detected
@@ -62,15 +78,42 @@ class Parser {
 		_string=3,
 		_badString=4,
 		_char=5,
-		_ddtSym=42,
-		_optionSym=43
+		_ddtSym=43,
+		_optionSym=44
+	};
+#ifdef PARSER_WITH_AST
+	enum eNonTerminals{
+		_Coco=0,
+		_SetDecl=1,
+		_TokenDecl=2,
+		_TokenExpr=3,
+		_Set=4,
+		_AttrDecl=5,
+		_SemText=6,
+		_Expression=7,
+		_SimSet=8,
+		_Char=9,
+		_Sym=10,
+		_Term=11,
+		_Resolver=12,
+		_Factor=13,
+		_Attribs=14,
+		_Condition=15,
+		_TokenTerm=16,
+		_TokenFactor=17
 	};
+#endif
 	int maxT;
 
 	Token *dummyToken;
 	int errDist;
 	int minErrDist;
 
+#ifdef PARSER_WITH_AST
+        void AstAddTerminal();
+        bool AstAddNonTerminal(eNonTerminals kind, const char *nt_name, int line);
+        void AstPopNonTerminal();
+#endif
 	void SynErr(int n);
 	void Get();
 	void Expect(int n);
@@ -85,6 +128,10 @@ class Parser {
 	Token *t;			// last recognized token
 	Token *la;			// lookahead token
 
+#ifdef PARSER_WITH_AST
+	SynTree *ast_root;
+	ArrayList ast_stack;
+#endif
 int id;
 	int str;
 

diff --git a/src/ParserGen.cpp b/src/ParserGen.cpp
@@ -196,11 +196,17 @@ void ParserGen::GenCode (Node *p, int indent, BitArray *isChecked) {
 		} else if (p->typ == Node::t) {
 			Indent(indent);
 			// assert: if isChecked[p->sym->n] is true, then isChecked contains only p->sym->n
-			if ((*isChecked)[p->sym->n]) fwprintf(gen, L"Get();\n");
+			if ((*isChecked)[p->sym->n]) {
+				fwprintf(gen, L"Get();\n");
+				//copied and pasted below
+				fwprintf(gen, L"#ifdef PARSER_WITH_AST\n\tAstAddTerminal();\n#endif\n");
+			}
 			else {
 				fwprintf(gen, L"Expect(");
 				WriteSymbolOrCode(gen, p->sym);
 				fwprintf(gen, L");\n");
+				//copied and pasted from above
+				fwprintf(gen, L"#ifdef PARSER_WITH_AST\n\tAstAddTerminal();\n#endif\n");
 			}
 		} if (p->typ == Node::wt) {
 			Indent(indent);
@@ -337,6 +343,19 @@ void ParserGen::GenTokensHeader() {
 	}
 
 	fwprintf(gen, L"\n\t};\n");
+
+        // nonterminals
+        fwprintf(gen, L"#ifdef PARSER_WITH_AST\n\tenum eNonTerminals{\n");
+        isFirst = true;
+        for (i=0; i<tab->nonterminals.Count; i++) {
+                sym = (Symbol*)tab->nonterminals[i];
+                if (isFirst) { isFirst = false; }
+                else { fwprintf(gen , L",\n"); }
+
+                fwprintf(gen , L"\t\t_%ls=%d", sym->name, sym->n);
+        }
+        fwprintf(gen, L"\n\t};\n#endif\n");
+
 }
 
 void ParserGen::GenCodePragmas() {
@@ -380,9 +399,19 @@ void ParserGen::GenProductions() {
 		CopySourcePart(sym->attrPos, 0);
 		fwprintf(gen, L") {\n");
 		CopySourcePart(sym->semPos, 2);
+                fwprintf(gen, L"#ifdef PARSER_WITH_AST\n");
+                if(i == 0) fwprintf(gen, L"\t\tToken *ntTok = new Token(); ntTok->kind = eNonTerminals::_%ls; ntTok->line = 0; ntTok->val = coco_string_create(\"%ls\");ast_root = new SynTree( ntTok ); ast_stack.Clear(); ast_stack.Add(ast_root);\n", sym->name, sym->name);
+                else {
+                        fwprintf(gen, L"\t\tbool ntAdded = AstAddNonTerminal(eNonTerminals::_%ls, \"%ls\", la->line);\n", sym->name, sym->name);
+                }
+                fwprintf(gen, L"#endif\n");
                 ba.SetAll(false);
 		GenCode(sym->graph, 2, &ba);
-		fwprintf(gen, L"}\n"); fwprintf(gen, L"\n");
+                fwprintf(gen, L"#ifdef PARSER_WITH_AST\n");
+                if(i == 0) fwprintf(gen, L"\t\tAstPopNonTerminal();\n");
+                else fwprintf(gen, L"\t\tif(ntAdded) AstPopNonTerminal();\n");
+                fwprintf(gen, L"#endif\n");
+		fwprintf(gen, L"}\n\n");
 	}
 }
 
@@ -405,6 +434,10 @@ void ParserGen::InitSets() {
 	fwprintf(gen, L"\t};\n\n");
 }
 
+void ParserGen::CheckAstGen() { // despite the name it checks nothing: it emits the AST member declarations
+        fwprintf(gen, L"#ifdef PARSER_WITH_AST\n\tSynTree *ast_root;\n\tArrayList ast_stack;\n#endif\n"); // WriteParser calls this right after the -->declarations frame part
+}
+
 void ParserGen::WriteParser () {
 	Generator g(tab, errors);
 	int oldPos = buffer->GetPos();  // Pos is modified by CopySourcePart
@@ -437,7 +470,7 @@ void ParserGen::WriteParser () {
 	g.CopyFramePart(L"-->constantsheader");
 	GenTokensHeader();  /* ML 2002/09/07 write the token kinds */
 	fwprintf(gen, L"\tint maxT;\n");
-	g.CopyFramePart(L"-->declarations"); CopySourcePart(tab->semDeclPos, 0);
+	g.CopyFramePart(L"-->declarations"); CheckAstGen(); CopySourcePart(tab->semDeclPos, 0);
 	g.CopyFramePart(L"-->productionsheader"); GenProductionsHeader();
 	g.CopyFramePart(L"-->namespace_close");
 	GenNamespaceClose(nrOfNs);

diff --git a/src/ParserGen.h b/src/ParserGen.h
@@ -90,6 +90,7 @@ class ParserGen
 	void WriteParser();
 	void WriteStatistics();
 	void WriteSymbolOrCode(FILE *gen, const Symbol *sym);
+        void CheckAstGen();
 	ParserGen (Parser *parser);
         ~ParserGen();
 

diff --git a/src/Scanner.cpp b/src/Scanner.cpp
@@ -244,6 +244,17 @@ Token::Token() {
 	next = NULL;
 }
 
+Token *Token::Clone() { // returns a Token allocated with new that copies this one's fields
+        Token *tk = new Token();
+	tk->kind = kind;
+	tk->pos = pos;
+	tk->col = col;
+	tk->line = line;
+	tk->val = coco_string_create(val); // separate string copy, since ~Token() frees val
+	tk->next = next; // pointer copied as-is: the clone refers to the same following token
+        return tk;
+}
+
 Token::~Token() {
 	coco_string_delete(val);
 }
@@ -264,7 +275,7 @@ Buffer::Buffer(FILE* s, bool isUserStream) {
 		fileLen = bufLen = bufStart = 0;
 	}
 	bufCapacity = (bufLen>0) ? bufLen : COCO_MIN_BUFFER_LENGTH;
-	buf = new unsigned char[bufCapacity];	
+	buf = new unsigned char[bufCapacity];
 	if (fileLen > 0) SetPos(0);          // setup  buffer to position 0 (start)
 	else bufPos = 0; // index 0 is already after the file, thus Pos = 0 is invalid
 	if (bufLen == fileLen && CanSeek()) Close();
@@ -294,7 +305,7 @@ Buffer::Buffer(const unsigned char* buf, int len) {
 }
 
 Buffer::~Buffer() {
-	Close(); 
+	Close();
 	if (buf != NULL) {
 		delete [] buf;
 		buf = NULL;
@@ -469,8 +480,8 @@ Scanner::~Scanner() {
 void Scanner::Init() {
 	EOL    = '\n';
 	eofSym = 0;
-	maxT = 41;
-	noSym = 41;
+	maxT = 42;
+	noSym = 42;
 	int i;
 	for (i = 65; i <= 90; ++i) start.set(i, 1);
 	for (i = 95; i <= 95; ++i) start.set(i, 1);
@@ -495,21 +506,22 @@ void Scanner::Init() {
 		start.set(Buffer::EoF, -1);
 	keywords.set(L"COMPILER", 6);
 	keywords.set(L"IGNORECASE", 7);
-	keywords.set(L"CHARACTERS", 8);
-	keywords.set(L"TOKENS", 9);
-	keywords.set(L"PRAGMAS", 10);
-	keywords.set(L"COMMENTS", 11);
-	keywords.set(L"FROM", 12);
-	keywords.set(L"TO", 13);
-	keywords.set(L"NESTED", 14);
-	keywords.set(L"IGNORE", 15);
-	keywords.set(L"PRODUCTIONS", 16);
-	keywords.set(L"END", 19);
-	keywords.set(L"ANY", 23);
-	keywords.set(L"WEAK", 29);
-	keywords.set(L"SYNC", 36);
-	keywords.set(L"IF", 37);
-	keywords.set(L"CONTEXT", 38);
+	keywords.set(L"TERMINALS", 8);
+	keywords.set(L"CHARACTERS", 9);
+	keywords.set(L"TOKENS", 10);
+	keywords.set(L"PRAGMAS", 11);
+	keywords.set(L"COMMENTS", 12);
+	keywords.set(L"FROM", 13);
+	keywords.set(L"TO", 14);
+	keywords.set(L"NESTED", 15);
+	keywords.set(L"IGNORE", 16);
+	keywords.set(L"PRODUCTIONS", 17);
+	keywords.set(L"END", 20);
+	keywords.set(L"ANY", 24);
+	keywords.set(L"WEAK", 30);
+	keywords.set(L"SYNC", 37);
+	keywords.set(L"IF", 38);
+	keywords.set(L"CONTEXT", 39);
 
 
 	tvalLength = 128;
@@ -729,14 +741,14 @@ Token* Scanner::NextToken() {
 			{t->kind = 5; break;}
 		case 10:
 			case_10:
-			recEnd = pos; recKind = 42;
+			recEnd = pos; recKind = 43;
 			if ((ch >= L'0' && ch <= L'9') || (ch >= L'A' && ch <= L'Z') || ch == L'_' || (ch >= L'a' && ch <= L'z')) {AddCh(); goto case_10;}
-			else {t->kind = 42; break;}
+			else {t->kind = 43; break;}
 		case 11:
 			case_11:
-			recEnd = pos; recKind = 43;
+			recEnd = pos; recKind = 44;
 			if ((ch >= L'-' && ch <= L'.') || (ch >= L'0' && ch <= L':') || (ch >= L'A' && ch <= L'Z') || ch == L'_' || (ch >= L'a' && ch <= L'z')) {AddCh(); goto case_11;}
-			else {t->kind = 43; break;}
+			else {t->kind = 44; break;}
 		case 12:
 			case_12:
 			if (ch <= 9 || (ch >= 11 && ch <= 12) || (ch >= 14 && ch <= L'!') || (ch >= L'#' && ch <= L'[') || (ch >= L']' && ch <= 65535)) {AddCh(); goto case_12;}
@@ -745,70 +757,70 @@ Token* Scanner::NextToken() {
 			else if (ch == 92) {AddCh(); goto case_14;}
 			else {goto case_0;}
 		case 13:
-			recEnd = pos; recKind = 42;
+			recEnd = pos; recKind = 43;
 			if ((ch >= L'0' && ch <= L'9')) {AddCh(); goto case_10;}
 			else if ((ch >= L'A' && ch <= L'Z') || ch == L'_' || (ch >= L'a' && ch <= L'z')) {AddCh(); goto case_15;}
-			else {t->kind = 42; break;}
+			else {t->kind = 43; break;}
 		case 14:
 			case_14:
 			if ((ch >= L' ' && ch <= L'~')) {AddCh(); goto case_12;}
 			else {goto case_0;}
 		case 15:
 			case_15:
-			recEnd = pos; recKind = 42;
+			recEnd = pos; recKind = 43;
 			if ((ch >= L'0' && ch <= L'9')) {AddCh(); goto case_10;}
 			else if ((ch >= L'A' && ch <= L'Z') || ch == L'_' || (ch >= L'a' && ch <= L'z')) {AddCh(); goto case_15;}
 			else if (ch == L'=') {AddCh(); goto case_11;}
-			else {t->kind = 42; break;}
+			else {t->kind = 43; break;}
 		case 16:
-			{t->kind = 17; break;}
+			{t->kind = 18; break;}
 		case 17:
-			{t->kind = 20; break;}
-		case 18:
 			{t->kind = 21; break;}
+		case 18:
+			{t->kind = 22; break;}
 		case 19:
 			case_19:
-			{t->kind = 22; break;}
+			{t->kind = 23; break;}
 		case 20:
-			{t->kind = 25; break;}
+			{t->kind = 26; break;}
 		case 21:
 			case_21:
-			{t->kind = 26; break;}
+			{t->kind = 27; break;}
 		case 22:
 			case_22:
-			{t->kind = 27; break;}
-		case 23:
 			{t->kind = 28; break;}
+		case 23:
+			{t->kind = 29; break;}
 		case 24:
-			{t->kind = 31; break;}
-		case 25:
 			{t->kind = 32; break;}
-		case 26:
+		case 25:
 			{t->kind = 33; break;}
-		case 27:
+		case 26:
 			{t->kind = 34; break;}
-		case 28:
+		case 27:
 			{t->kind = 35; break;}
+		case 28:
+			{t->kind = 36; break;}
 		case 29:
 			case_29:
-			{t->kind = 39; break;}
+			{t->kind = 40; break;}
 		case 30:
 			case_30:
-			{t->kind = 40; break;}
+			{t->kind = 41; break;}
 		case 31:
-			recEnd = pos; recKind = 18;
+			recEnd = pos; recKind = 19;
 			if (ch == L'.') {AddCh(); goto case_19;}
 			else if (ch == L'>') {AddCh(); goto case_22;}
 			else if (ch == L')') {AddCh(); goto case_30;}
-			else {t->kind = 18; break;}
+			else {t->kind = 19; break;}
 		case 32:
-			recEnd = pos; recKind = 24;
+			recEnd = pos; recKind = 25;
 			if (ch == L'.') {AddCh(); goto case_21;}
-			else {t->kind = 24; break;}
+			else {t->kind = 25; break;}
 		case 33:
-			recEnd = pos; recKind = 30;
+			recEnd = pos; recKind = 31;
 			if (ch == L'.') {AddCh(); goto case_29;}
-			else {t->kind = 30; break;}
+			else {t->kind = 31; break;}
 
 	}
 	AppendVal(t);

diff --git a/src/Scanner.frame b/src/Scanner.frame
@@ -5,24 +5,24 @@ extended by M. Loeberbauer & A. Woess, Univ. of Linz
 ported to C++ by Csaba Balazs, University of Szeged
 with improvements by Pat Terry, Rhodes University
 
-This program is free software; you can redistribute it and/or modify it 
-under the terms of the GNU General Public License as published by the 
-Free Software Foundation; either version 2, or (at your option) any 
+This program is free software; you can redistribute it and/or modify it
+under the terms of the GNU General Public License as published by the
+Free Software Foundation; either version 2, or (at your option) any
 later version.
 
-This program is distributed in the hope that it will be useful, but 
-WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY 
-or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License 
+This program is distributed in the hope that it will be useful, but
+WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 for more details.
 
-You should have received a copy of the GNU General Public License along 
-with this program; if not, write to the Free Software Foundation, Inc., 
+You should have received a copy of the GNU General Public License along
+with this program; if not, write to the Free Software Foundation, Inc.,
 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
 
 As an exception, it is allowed to write an extension of Coco/R that is
 used as a plugin in non-free software.
 
-If not otherwise stated, any source code generated by Coco/R (other than 
+If not otherwise stated, any source code generated by Coco/R (other than
 Coco/R itself) does not fall under the GNU General Public License.
 -----------------------------------------------------------------------*/
 
@@ -95,7 +95,7 @@ char* coco_string_create_char(const wchar_t *value);
 void  coco_string_delete(char* &data);
 
 
-class Token  
+class Token
 {
 public:
 	int kind;     // token kind
@@ -107,6 +107,7 @@ public:
 	Token *next;  // ML 2005-03-11 Peek tokens are kept in linked list
 
 	Token();
+        Token *Clone();
 	~Token();
 };
 
@@ -125,18 +126,18 @@ private:
 	int bufPos;         // current position in buffer
 	FILE* stream;       // input stream (seekable)
 	bool isUserStream;  // was the stream opened by the user?
-	
+
 	int ReadNextStreamChunk();
 	bool CanSeek();     // true if stream can be seeked otherwise false
-	
+
 public:
 	static const int EoF = COCO_WCHAR_MAX + 1;
 
 	Buffer(FILE* s, bool isUserStream);
 	Buffer(const unsigned char* buf, int len);
 	Buffer(Buffer *b);
 	virtual ~Buffer();
-	
+
 	virtual void Close();
 	virtual int Read();
 	virtual int Peek();
@@ -284,7 +285,7 @@ private:
 
 public:
 	Buffer *buffer;   // scanner buffer
-	
+
 	Scanner(const unsigned char* buf, int len);
 	Scanner(const wchar_t* fileName);
 	Scanner(FILE* s);
@@ -523,6 +524,17 @@ Token::Token() {
 	next = NULL;
 }
 
+Token *Token::Clone() { // returns a Token allocated with new that copies this one's fields
+        Token *tk = new Token();
+	tk->kind = kind;
+	tk->pos = pos;
+	tk->col = col;
+	tk->line = line;
+	tk->val = coco_string_create(val); // separate string copy, since ~Token() frees val
+	tk->next = next; // pointer copied as-is: the clone refers to the same following token
+        return tk;
+}
+
 Token::~Token() {
 	coco_string_delete(val);
 }
@@ -543,7 +555,7 @@ Buffer::Buffer(FILE* s, bool isUserStream) {
 		fileLen = bufLen = bufStart = 0;
 	}
 	bufCapacity = (bufLen>0) ? bufLen : COCO_MIN_BUFFER_LENGTH;
-	buf = new unsigned char[bufCapacity];	
+	buf = new unsigned char[bufCapacity];
 	if (fileLen > 0) SetPos(0);          // setup  buffer to position 0 (start)
 	else bufPos = 0; // index 0 is already after the file, thus Pos = 0 is invalid
 	if (bufLen == fileLen && CanSeek()) Close();
@@ -573,7 +585,7 @@ Buffer::Buffer(const unsigned char* buf, int len) {
 }
 
 Buffer::~Buffer() {
-	Close(); 
+	Close();
 	if (buf != NULL) {
 		delete [] buf;
 		buf = NULL;

diff --git a/src/Scanner.h b/src/Scanner.h
@@ -91,7 +91,7 @@ char* coco_string_create_char(const wchar_t *value);
 void  coco_string_delete(char* &data);
 
 
-class Token  
+class Token
 {
 public:
 	int kind;     // token kind
@@ -103,6 +103,7 @@ class Token
 	Token *next;  // ML 2005-03-11 Peek tokens are kept in linked list
 
 	Token();
+        Token *Clone();
 	~Token();
 };
 
@@ -121,18 +122,18 @@ class Buffer {
 	int bufPos;         // current position in buffer
 	FILE* stream;       // input stream (seekable)
 	bool isUserStream;  // was the stream opened by the user?
-	
+
 	int ReadNextStreamChunk();
 	bool CanSeek();     // true if stream can be seeked otherwise false
-	
+
 public:
 	static const int EoF = COCO_WCHAR_MAX + 1;
 
 	Buffer(FILE* s, bool isUserStream);
 	Buffer(const unsigned char* buf, int len);
 	Buffer(Buffer *b);
 	virtual ~Buffer();
-	
+
 	virtual void Close();
 	virtual int Read();
 	virtual int Peek();
@@ -282,7 +283,7 @@ class Scanner {
 
 public:
 	Buffer *buffer;   // scanner buffer
-	
+
 	Scanner(const unsigned char* buf, int len);
 	Scanner(const wchar_t* fileName);
 	Scanner(FILE* s);

diff --git a/src/Tab.h b/src/Tab.h
@@ -88,7 +88,6 @@ class Tab {
 	ArrayList classes;
 	int dummyName;
 
-
 	Tab(Parser *parser);
         ~Tab();