Context Navigation

parser.yy @ bff09c8

Branches: ADT, aaron-thesis, arm-eh, ast-experimental, cleanup-dtors, deferred_resn, demangler, enum, forall-pointer-decay, jacob/cs343-translation, jenkins-sandbox, new-ast, new-ast-unique-expr, new-env, no_list, persistent-indexer, pthread-emulation, qualifiedEnum, resolv-new, with_gc

Last change on this file since bff09c8 was fc1ef62, checked in by Peter A. Buhr <pabuhr@…>, 7 years ago
add %precedence operator precedence
Property mode set to `100644`
File size: 11.7 KB

Line
1	//
2	// Cforall Version 1.0.0 Copyright (C) 2015 University of Waterloo
3	//
4	// The contents of this file are covered under the licence agreement in the
5	// file "LICENCE" distributed with Cforall.
6	//
7	// parser.yy --
8	//
9	// Author : Rodolfo G. Esteves
10	// Created On : Sat Dec 15 13:44:21 2001
11	// Last Modified By : Peter A. Buhr
12	// Last Modified On : Tue Aug 29 16:34:10 2017
13	// Update Count : 1047
14	//
15
16	%{
17	#define YYDEBUG_LEXER_TEXT( yylval ) // lexer loads this up each time
18	#define YYDEBUG 1 // get the pretty debugging code to compile
19
20	#include <iostream>
21	using namespace std;
22	#include "ParserTypes.h"
23	#include "filter.h"
24
25	extern list<string> ws_list; // lex variable containing accumulated whitespace
26	void lexC( void );
27	string lexYacc( void );
28
29	void yyerror( string s ) { // report message s on cerr, prefixed with the current value of yylineno
30	extern int yylineno; // line counter defined outside this file (presumably maintained by the lexer -- confirm)
31
32	cerr << "Error in line: " << yylineno << ": " << s << endl;
33	return;
34	}
35
36	Token *declstart; // head of the declaration list: set in "declarations", read in "defsection_opt"
37	Token *rulestart; // first "rule" node: set in the empty alternative of "rhs", read in "rules" and "rhs"
38	Token *nameliststart; // head of the current name list: set in "namenolist"/"namelist", read in "declaration"
39	%}
40
41	%union { // semantic value type used by the <tokenp> tokens and nonterminals declared below
42	Token *tokenp; // pointer to a parse-tree Token
43	}
44
45	%token<tokenp> ','
46	%token<tokenp> '<'
47	%token<tokenp> '>'
48	%token<tokenp> '{'
49	%token<tokenp> '}'
50	%token<tokenp> ':'
51	%token<tokenp> ';'
52	%token<tokenp> '\|'
53
54	%token<tokenp> MARK // %%
55	%token<tokenp> LCURL // %{
56	%token<tokenp> RCURL // %}
57
58	%token<tokenp> INTEGER // integer constant
59	%token<tokenp> CHARACTER // character constant
60	%token<tokenp> IDENTIFIER // identifier
61	%token<tokenp> CODE // C code
62
63	%token<tokenp> START // %start
64	%token<tokenp> UNION // %union
65	%token<tokenp> TOKEN // %token
66	%token<tokenp> LEFT // %left
67	%token<tokenp> RIGHT // %right
68	%token<tokenp> NONASSOC // %nonassoc
69	%token<tokenp> PRECEDENCE // %precedence
70	%token<tokenp> TYPE // %type
71	%token<tokenp> PURE_PARSER // %pure_parser
72	%token<tokenp> SEMANTIC_PARSER // %semantic_parser
73	%token<tokenp> EXPECT // %expect
74	%token<tokenp> THONG // %thong
75
76	%token<tokenp> PREC // %prec
77
78	%token END_TERMINALS // ALL TERMINAL TOKEN NAMES MUST APPEAR BEFORE THIS
79
80	%type<tokenp> sections
81	%token _SECTIONS
82	%type<tokenp> mark
83	%type<tokenp> defsection_opt
84	%token _DEFSECTION_OPT
85	%type<tokenp> declarations
86	%type<tokenp> literalblock
87	%token _LITERALBLOCK
88	%type<tokenp> declaration
89	%token _DECLARATION
90	%type<tokenp> union
91	%type<tokenp> rword
92	%type<tokenp> tag_opt
93	%token _TAG_OPT
94	%type<tokenp> namenolist
95	%token _NAMENOLIST
96	%type<tokenp> nameno
97	%token _NAMENO
98	%type<tokenp> namelist
99	%token _NAMELIST
100	%type<tokenp> name
101	%type<tokenp> rulesection
102	%token _RULESECTION
103	%type<tokenp> rules
104	%token _RULE
105	%type<tokenp> lhs
106	%token _LHS
107	%type<tokenp> rhs
108	%token _RHS
109	%type<tokenp> prod
110	%type<tokenp> prec
111	%token _PREC
112	%type<tokenp> action
113	%token _ACTION
114	%type<tokenp> usersection_opt
115	%token _USERSECTION_OPT
116	%type<tokenp> ccode_opt
117	%type<tokenp> blocks
118
119	%start grammar
120
121	%%
122	grammar : // start symbol (see %start): builds the whole tree, then filters and frees it
123	sections
124	{
125	filter( $1 ); // filter parse tree
126	freeTree( $1 ); // free parse-tree storage (optional: used with purify)
127	}
128	;
129
130	sections : // definition section, %% mark, rule section, optional user section
131	defsection_opt mark rulesection usersection_opt
132	{
133	$$ = new Token( "sections", _SECTIONS ); // parent node for the four parts
134	$1->left = $2; // chain the four parts through their left links, in source order
135	$2->left = $3;
136	$3->left = $4;
137	$$->down = $1; // first part is attached below the parent through down
138	}
139	;
140
141	mark : // the %% token that ends the definition section
142	MARK
143	\| error // missing %%
144	{
145	cerr << "no input grammar, missing %% mark" << endl;
146	exit( -1 ); // no recovery is attempted: the program terminates here
147	}
148	;
149
150	defsection_opt : // optional definition section; always yields a _DEFSECTION_OPT node
151	// empty
152	{
153	//cerr << "defsection_opt1: " << endl;
154	$$ = new Token( "declaration_opt", _DEFSECTION_OPT ); // down is not assigned in this alternative
155	}
156	\| declarations
157	{
158	//cerr << "defsection_opt2: " << $1->text << "(" << $1 << ")" << endl;
159	$$ = new Token( "declaration_opt", _DEFSECTION_OPT );
160	$$->down = declstart; // $1 is the list tail, so the list head is taken from the global set in "declarations"
161	}
162	;
163
164	declarations : // left-linked list of literal blocks and declarations; $$ is always the current list tail
165	literalblock
166	{
167	//cerr << "declarations1: " << $1->text << "(" << $1 << ")" << endl;
168	$$ = declstart = $1; // first element: also remember it as the list head
169	}
170	\| declaration
171	{
172	//cerr << "declarations2: " << $1->text << "(" << $1 << ")" << endl;
173	$$ = declstart = new Token( "declaration", _DECLARATION ); // wrapper node becomes head and tail
174	$$->down = $1; // the parsed declaration is attached below the wrapper
175	}
176	\| declarations literalblock
177	{
178	//cerr << "declarations3: "<< $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
179	$1->left = $2; // append after the previous tail
180	$$ = $2; // appended element is the new tail
181	}
182	\| declarations declaration
183	{
184	//cerr << "declarations4: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
185	$$ = new Token( "declaration", _DECLARATION ); // wrapper node is the new tail
186	$1->left = $$; // append the wrapper after the previous tail
187	$$->down = $2;
188	}
189	;
190
191	literalblock : // %{ C code %}
192	LCURL
193	{ lexC(); } // mid-rule action (position $2), run before ccode_opt is parsed; presumably switches the lexer to C-code scanning -- confirm
194	ccode_opt
195	{ $<tokenp>$ = new Token( lexYacc(), CODE ); } // mid-rule action (position $4): wraps the string returned by lexYacc() in a CODE token
196	RCURL
197	{
198	//cerr << "literalblock: " << $1->text << "(" << $1 << ") " << $<tokenp>4->text << " " << $5->text << "(" << $5 << ")" << endl;
199	$1->left = $<tokenp>4; // chain: LCURL -> code token -> RCURL
200	$<tokenp>4->left = $5;
201	$$ = new Token( "literalblock", _LITERALBLOCK );
202	$$->down = $1; // chain is attached below the new node
203	}
204	;
205
206	declaration : // one definition-section directive; $$ is the directive's leading keyword token in every alternative
207	union
208	\| START IDENTIFIER
209	{
210	$1->left = $2; // chain: START -> IDENTIFIER
211	$$ = $1;
212	}
213	\| rword tag_opt namenolist
214	{
215	Token *n = new Token( "namenolist", _NAMENOLIST );
216	n->down = nameliststart; // $3 is the list tail; the list head was saved by "namenolist"
217	$1->left = $2; // chain: keyword -> tag_opt -> namenolist node
218	$2->left = n;
219	$$ = $1;
220	}
221	\| TYPE tag_opt namelist
222	{
223	Token *n = new Token( "namelist", _NAMELIST );
224	n->down = nameliststart; // $3 is the list tail; the list head was saved by "namelist"
225	$1->left = $2; // chain: TYPE -> tag_opt -> namelist node
226	$2->left = n;
227	$$ = $1;
228	}
229	\| PURE_PARSER
230	\| SEMANTIC_PARSER
231	\| EXPECT INTEGER // bison
232	{
233	$1->left = $2; // chain: EXPECT -> INTEGER
234	$$ = $1;
235	}
236	\| THONG // bison
237	;
238
239	union : // %union { C code }
240	UNION '{'
241	{ lexC(); } // mid-rule action (position $3), run before ccode_opt is parsed
242	ccode_opt
243	{
244	// Remove the trailing '}' which is added in lex.
245	string temp( lexYacc() );
246	$<tokenp>$ = new Token( temp.substr( 0, temp.length() - 1 ), CODE ); // mid-rule value (position $5): code text minus its last character
247	}
248	'}'
249	{
250	$1->left = $2; // chain: UNION -> '{' -> code token -> '}'
251	$2->left = $<tokenp>5;
252	$<tokenp>5->left = $6;
253	$$ = $1; // result is the UNION keyword token heading the chain
254	}
255	;
256
257	rword : // keywords used by "declaration" in the form: rword tag_opt namenolist
258	TOKEN
259	\| LEFT
260	\| RIGHT
261	\| NONASSOC
262	\| PRECEDENCE
263	;
264
265	tag_opt : // optional <IDENTIFIER> tag; always yields a _TAG_OPT node
266	// empty
267	{
268	//cerr << "tag_opt" << endl;
269	$$ = new Token( "tag_opt", _TAG_OPT ); // down is not assigned in this alternative
270	}
271	\| '<' IDENTIFIER '>'
272	{
273	$1->left = $2; // chain: '<' -> IDENTIFIER -> '>'
274	$2->left = $3;
275	$$ = new Token( "tag_opt", _TAG_OPT );
276	$$->down = $1; // chain is attached below the new node
277	}
278	;
279
280	namenolist : // list of nameno elements, optionally comma separated; $$ is always the list tail
281	nameno
282	{
283	//cerr << "namenolist1: " << $1->text << "(" << $1 << ")" << endl;
284	$$ = nameliststart = $1; // first element: also remember it as the list head
285	}
286	\| namenolist nameno
287	{
288	//cerr << "namenolist2: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
289	$1->left = $2; // append after the previous tail
290	$$ = $2;
291	}
292	\| namenolist ',' nameno
293	{
294	//cerr << "namenolist3: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ") " << $3->text << "(" << $3 << ")" << endl;
295	$1->left = $2; // the ',' token is kept in the chain between the elements
296	$2->left = $3;
297	$$ = $3;
298	}
299	;
300
301	nameno : // a name optionally followed by an integer; yields a _NAMENO node with the name below it
302	name
303	{
304	$$ = new Token( "nameno", _NAMENO );
305	$$->down = $1;
306	}
307	\| name INTEGER
308	{
309	$$ = new Token( "nameno", _NAMENO );
310	$1->left = $2; // chain: name -> INTEGER
311	$$->down = $1;
312	}
313	;
314
315	namelist : // list of names, optionally comma separated; $$ is always the list tail
316	name
317	{
318	//cerr << "namelist1: " << $1->text << "(" << $1 << ")" << endl;
319	$$ = nameliststart = $1; // first element: also remember it as the list head
320	}
321	\| namelist name
322	{
323	//cerr << "namelist2: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
324	$1->left = $2; // append after the previous tail
325	$$ = $2;
326	}
327	\| namelist ',' name
328	{
329	//cerr << "namelist3: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ") " << $3->text << "(" << $3 << ")" << endl;
330	$1->left = $2; // the ',' token is kept in the chain between the names
331	$2->left = $3;
332	$$ = $3;
333	}
334	;
335
336	name : // identifier or character constant; no action, so the token is passed through by the default action
337	IDENTIFIER
338	\| CHARACTER
339	;
340
341	rulesection : // the grammar rules after the %% mark; yields a _RULESECTION node
342	rules
343	{
344	//cerr << "rulesection1: " << $1->text << "(" << $1 << ")" << endl;
345	$$ = new Token( "rulesection", _RULESECTION );
346	$$->down = $1; // $1 is rulestart, the first "rule" node (see "rules")
347	}
348	\| error // no rules
349	{
350	cerr << "no rules in the input grammar" << endl;
351	exit( -1 ); // no recovery is attempted: the program terminates here
352	}
353	;
354
355	// These grammar rules are complex because the Yacc language is LR(2) due to the optional ';' at the end of rules. The
356	// following rules convert the LR(2) grammar into LR(1) by lengthening the rules to allow sufficient look
357	// ahead. Unfortunately, this change makes handling the semantic actions more complex because there are two lists
358	// (rules, rhs) being built but only one list tail can be returned through $$ for chaining.
359
360	rules : // all rules of the grammar; the rule list itself is built inside "rhs", so $$ is the saved head
361	lhs rhs
362	{
363	//cerr << "rules1: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
364	$$ = rulestart; // head of the rule list, created by the empty alternative of "rhs"
365	}
366	\| lhs rhs ';'
367	{
368	//cerr << "rules2: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ") " << $3->text << "(" << $3 << ")" << endl;
369	$2->addDownLeftTail( $3 ); // attach the final ';' to the last rhs (presumably at the end of the chain below it -- confirm against Token)
370	$$ = rulestart;
371	}
372	;
373
374	lhs : // left-hand side of a rule: IDENTIFIER ':'; yields an _LHS node
375	IDENTIFIER ':'
376	{
377	//cerr << "lhs: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
378	$$ = new Token( "lhs", _LHS );
379	//cerr << " lhs: " << $$->text << "(" << $$ << ")" << endl;
380	$1->left = $2; // chain: IDENTIFIER -> ':'
381	$$->down = $1; // chain is attached below the new node
382	}
383	;
384
385	rhs : // builds both the rule list and each rule's right-hand sides; $$ is the rhs node currently being filled
386	// empty
387	{
388	//cerr << "rhs1: " << $<tokenp>0->text << "(" << $<tokenp>0 << ")" << endl;
389	rulestart = new Token( "rule", _RULE ); // first rule node: becomes the head of the rule list
390	rulestart->down = $<tokenp>0; // initial lhs is already on the stack from "rules"
391	$$ = new Token( "rhs", _RHS );
392	//cerr << " rhs: " << $$->text << "(" << $$ << ")" << endl;
393	$<tokenp>0->left = $$; // link: lhs -> its first rhs node
394	}
395	\| rhs lhs
396	{
397	//cerr << "rhs2: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
398	Token *temp = new Token( "rule", _RULE ); // a new lhs starts a new rule
399	rulestart->addLeftTail( temp ); // presumably appends at the end of the rule list's left chain -- confirm against Token
400	temp->down = $2;
401	$$ = new Token( "rhs", _RHS ); // fresh rhs node for the new rule
402	//cerr << " rhs: " << $$->text << "(" << $$ << ")" << endl;
403	$2->left = $$; // link: lhs -> its first rhs node
404	}
405	\| rhs ';' lhs
406	{
407	//cerr << "rhs3: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ") " << $3->text << "(" << $3 << ")" << endl;
408	$1->addDownLeftTail( $2 ); // the ';' is attached to the rhs it terminates
409	Token *temp = new Token( "rule", _RULE ); // then a new rule starts, as in the previous alternative
410	rulestart->addLeftTail( temp );
411	temp->down = $3;
412	$$ = new Token( "rhs", _RHS );
413	//cerr << " rhs: " << $$->text << "(" << $$ << ")" << endl;
414	$3->left = $$; // link: lhs -> its first rhs node
415	}
416	\| rhs prod
417	{
418	//cerr << "rhs4: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
419	$1->addDownLeftTail( $2 ); // add the element to the current rhs
420	$$ = $1; // same rhs node continues
421	}
422	\| rhs '\|'
423	{
424	//cerr << "rhs5: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
425	$1->addDownLeftTail( $2 ); // the separator token is attached to the rhs it ends
426	$$ = new Token( "rhs", _RHS ); // fresh rhs node for the next alternative of the same rule
427	$1->left = $$; // link: previous rhs -> next rhs
428	//cerr << " rhs: " << $$->text << "(" << $$ << ")" << endl;
429	}
430	;
431
432	prod : // one element of a right-hand side; no actions, so each alternative is passed through by the default action
433	action
434	\| IDENTIFIER
435	\| CHARACTER
436	\| prec
437	;
438
439	prec : // %prec name; yields a _PREC node
440	PREC name
441	{
442	//cerr << "prec: " << $1->text << "(" << $1 << ") " << $2->text << "(" << $2 << ")" << endl;
443	$1->left = $2; // chain: PREC -> name
444	$$ = new Token( "prec", _PREC );
445	$$->down = $1; // chain is attached below the new node
446	}
447	;
448
449	action : // { C code } inside a rule; yields an _ACTION node
450	'{'
451	{ lexC(); } // mid-rule action (position $2), run before ccode_opt is parsed
452	ccode_opt
453	{
454	// Remove the trailing '}' added in lex.
455	string temp( lexYacc() );
456	$<tokenp>$ = new Token( temp.substr( 0, temp.length() - 1 ), CODE ); // mid-rule value (position $4): code text minus its last character
457	}
458	'}'
459	{
460	$1->left = $<tokenp>4; // chain: '{' -> code token -> '}'
461	$<tokenp>4->left = $5;
462	$$ = new Token( "action", _ACTION );
463	$$->down = $1; // chain is attached below the new node
464	}
465	;
466
467	usersection_opt : // optional second %% followed by user code; always yields a _USERSECTION_OPT node
468	// empty
469	{
470	//cerr << "usersection_opt" << endl;
471	// attach remaining WS to fictitious code
472	Token *temp = new Token( "", ws_list, CODE ); // CODE token with empty text, constructed with the accumulated whitespace list
473	$$ = new Token( "usersection_opt", _USERSECTION_OPT );
474	$$->down = temp;
475	}
476	\| MARK
477	{ lexC(); } // mid-rule action (position $2), run before ccode_opt is parsed
478	ccode_opt
479	{
480	Token *temp = new Token( lexYacc(), CODE ); // wraps the string returned by lexYacc() in a CODE token
481	//cerr << "usersection_opt: " << $1->text << " " << temp->text << endl;
482	$1->left = temp; // chain: MARK -> code token
483	$$ = new Token( "usersection_opt", _USERSECTION_OPT );
484	$$->down = $1;
485	}
486	;
487
488	ccode_opt : // optional nested brace blocks inside C code; no rule in this file reads its semantic value
489	// empty
490	{} // explicit empty action: $$ is deliberately left unassigned
491	\| blocks
492	;
493
494	// This rule matches internal braces "{}" in C code to the level of the braces of a union/action. These internal braces
495	// are returned as Tokens from the lexer but are unused because the braces are already concatenated into the code string
496	// built by the lexer. Therefore, the tokens for the braces are immediately deleted.
497
498	blocks : // one or more balanced { ... } groups, possibly nested through ccode_opt
499	'{'
500	{ delete $1; } // mid-rule action: discard the '{' token as soon as it is seen
501	ccode_opt '}'
502	{ delete $4; } // $4 is the '}' because the mid-rule action occupies position $3's predecessor slot ($2)
503	\| blocks '{'
504	{ delete $2; } // mid-rule action: discard the '{' token
505	ccode_opt '}'
506	{ delete $5; } // $5 is the '}' (positions: blocks, '{', mid-rule action, ccode_opt, '}')
507	;
508	%%
509
510	// Local Variables: //
511	// mode: c++ //
512	// tab-width: 4 //
513	// compile-command: "make install" //
514	// End: //

Note: See TracBrowser for help on using the repository browser.

Download in other formats:

Original Format