]>
Commit | Line | Data |
---|---|---|
3cedc2dc AD |
1 | #! /usr/bin/perl -w |
2 | ||
7d6bad19 | 3 | # Copyright (C) 2006, 2008-2013 Free Software Foundation, Inc. |
f16b0819 | 4 | # |
3cedc2dc | 5 | # This file is part of Bison, the GNU Compiler Compiler. |
f16b0819 PE |
6 | # |
7 | # This program is free software: you can redistribute it and/or modify | |
3cedc2dc | 8 | # it under the terms of the GNU General Public License as published by |
f16b0819 PE |
9 | # the Free Software Foundation, either version 3 of the License, or |
10 | # (at your option) any later version. | |
11 | # | |
12 | # This program is distributed in the hope that it will be useful, | |
3cedc2dc AD |
13 | # but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
15 | # GNU General Public License for more details. | |
f16b0819 | 16 | # |
3cedc2dc | 17 | # You should have received a copy of the GNU General Public License |
f16b0819 PE |
18 | # along with this program. If not, see <http://www.gnu.org/licenses/>. |
19 | ||
15129f25 AD |
20 | =head1 NAME |
21 | ||
f10e19fd | 22 | bench.pl - benchmarks for Bison parsers. |
15129f25 AD |
23 | |
24 | =head1 SYNOPSIS | |
25 | ||
9b0efa5b | 26 | ./bench.pl [OPTIONS]... DIRECTIVES |
15129f25 | 27 | |
f10e19fd | 28 | =head1 DIRECTIVES |
a6df593d | 29 | |
f10e19fd AD |
30 | Specify the set of benches to run. The following grammar defines the |
31 | I<directives>: | |
32 | ||
c17f9a4a AD |
33 | directives ::= |
34 | directives | directives -- Alternation | |
35 | | directives & directives -- Concatenation | |
36 | [ directives ] -- Optional | |
37 | ( directives ) -- Parentheses | |
ca42755f | 38 | | %b PATH -- Use bison at PATH for this bench |
fce629c0 AD |
39 | | #d NAME[=VALUE] -- %code { #define NAME [VALUE] } |
40 | | %d NAME[=VALUE] -- %define NAME ["VALUE"] | |
c17f9a4a | 41 | | %s skeleton -- %skeleton "skeleton" |
c17f9a4a | 42 | | directive |
f10e19fd AD |
43 | |
44 | Parentheses only group to override precedence. For instance: | |
45 | ||
46 | [ %debug ] & [ %error-verbose ] & [ %define variant ] | |
47 | ||
48 | will generate eight different cases. | |
49 | ||
50 | =head1 OPTIONS | |
51 | ||
52 | =over 4 | |
53 | ||
54 | =item B<-b>, B<--bench> | |
55 | ||
56 | Predefined benches, that is, combinations of a grammar and a I<directives> | |
57 | request. | |
a6df593d AD |
58 | |
59 | =over 4 | |
60 | ||
a6df593d AD |
61 | =item I<push> |
62 | ||
63 | Test the push parser vs. the pull interface. Use the C parser. | |
64 | ||
65 | =item I<variant> | |
66 | ||
67 | Test the use of variants instead of union in the C++ parser. | |
68 | ||
69 | =back | |
70 | ||
7e5f9c54 AD |
71 | =item B<-c>, B<--cflags>=I<flags> |
72 | ||
ef05c4d6 AD |
73 | Flags to pass to the C or C++ compiler. Defaults to -O2. |
74 | ||
757f8f98 AD |
75 | =item B<-d>, B<--directive>=I<directives> |
76 | ||
77 | Add a set of Bison directives to bench against each other. | |
78 | ||
f10e19fd AD |
79 | =item B<-g>, B<--grammar>=I<grammar> |
80 | ||
81 | Select the base I<grammar> to use. Defaults to I<calc>. | |
82 | ||
83 | =over 4 | |
84 | ||
85 | =item I<calc> | |
86 | ||
87 | Traditional calculator. | |
88 | ||
89 | =item I<list> | |
90 | ||
91 | C++ grammar that uses std::string and std::list. Can be used with | |
92 | or without %define variant. | |
93 | ||
94 | =item I<triangular> | |
95 | ||
96 | Artificial grammar with very long rules. | |
97 | ||
98 | =back | |
99 | ||
ef05c4d6 AD |
100 | =item B<-h>, B<--help> |
101 | ||
102 | Display this message and exit successfully. The more verbose, the more | |
103 | details. | |
7e5f9c54 AD |
104 | |
105 | =item B<-i>, B<--iterations>=I<integer> | |
106 | ||
d11ee647 AD |
107 | Say how many times a single test of the bench must be run. If |
108 | negative, specify the minimum number of CPU seconds to run. Defaults | |
ef05c4d6 AD |
109 | to -1. |
110 | ||
111 | =item B<-q>, B<--quiet> | |
112 | ||
113 | Decrease the verbosity level (defaults to 1). | |
7e5f9c54 AD |
114 | |
115 | =item B<-v>, B<--verbose> | |
116 | ||
ef05c4d6 | 117 | Raise the verbosity level (defaults to 1). |
7e5f9c54 | 118 | |
e1b74b92 AD |
119 | =back |
120 | ||
15129f25 AD |
121 | =cut |
122 | ||
3a2803df | 123 | use strict; |
3cedc2dc | 124 | use IO::File; |
3cedc2dc | 125 | |
e1b74b92 AD |
126 | ################################################################## |
127 | ||
128 | =head1 VARIABLES | |
129 | ||
130 | =over 4 | |
131 | ||
3a2803df AD |
132 | =item C<@bench> |
133 | ||
134 | The list of benches to run. | |
135 | ||
e1b74b92 AD |
136 | =item C<$bison> |
137 | ||
138 | The Bison program to use to compile the grammar. | |
139 | ||
140 | =item C<$cc> | |
141 | ||
142 | The C compiler. | |
143 | ||
144 | =item C<$cxx> | |
145 | ||
146 | The C++ compiler. | |
147 | ||
148 | =item C<$cflags> | |
149 | ||
150 | Compiler flags (C or C++). | |
151 | ||
757f8f98 AD |
152 | =item C<@directive> |
153 | ||
154 | A list of directive sets to measure against each other. | |
155 | ||
e1b74b92 AD |
156 | =item C<$iterations> |
157 | ||
158 | The number of times the parser is run for a bench. | |
159 | ||
160 | =item C<$verbose> | |
161 | ||
162 | Verbosity level. | |
163 | ||
164 | =back | |
165 | ||
166 | =cut | |
167 | ||
# File-level settings read by the functions below.

# Declared without a value.
my $bench;

# External programs: a non-empty environment variable takes precedence
# over the built-in fallback.  '@abs_top_builddir@' is a literal
# placeholder at this point (presumably substituted at configure
# time -- confirm against the build system).
my $bison = $ENV{BISON} || '@abs_top_builddir@/tests/bison';
my $cc    = $ENV{CC}    || 'gcc';
my $cxx   = $ENV{CXX}   || 'g++';

# Compiler flags, shared by the C and C++ compilers.
my $cflags = '-O2';

# Directive sets to measure against each other; empty by default.
my @directive;

# Base grammar.
my $grammar = 'calc';

# Number of runs per bench; see --iterations for the meaning of a
# negative value.
my $iterations = -1;

# Messages whose level exceeds this value are not printed.
my $verbose = 1;
3cedc2dc | 177 | |
e1b74b92 | 178 | =head1 FUNCTIONS |
3cedc2dc | 179 | |
e1b74b92 | 180 | =over 4 |
7e5f9c54 | 181 | |
e1b74b92 | 182 | =item C<verbose($level, $message)> |
15129f25 | 183 | |
e1b74b92 AD |
184 | Report the C<$message> if C<$level> E<lt>= C<$verbose>. |
185 | ||
186 | =cut | |
187 | ||
# Write $message to STDERR, but only when $level does not exceed the
# file-level $verbose setting.  The message is printed as is: no
# newline is appended.
sub verbose($$)
{
  my ($level, $message) = @_;
  if ($level <= $verbose)
    {
      print STDERR $message;
    }
}
15129f25 | 194 | |
3a2803df AD |
195 | |
196 | ###################################################################### | |
197 | ||
922730fe AD |
198 | =item C<directives($bench, @directive)> |
199 | ||
200 | Format the list of directives for Bison for bench named C<$bench>. | |
201 | ||
202 | =cut | |
203 | ||
# Return the text block holding @directive, one directive per line,
# framed by two C comments that name the bench $bench.  With no
# directive at all the frame still encloses one empty line.
sub directives($@)
{
  my ($bench, @directive) = @_;
  return join ('',
               "/* Directives for bench `$bench'. */\n",
               join ("\n", @directive), "\n",
               "/* End of directives for bench `$bench'. */\n");
}
212 | ||
3a2803df AD |
213 | ###################################################################### |
214 | ||
215 | =item C<generate_grammar_triangular ($base, $max, @directive)> | |
15129f25 AD |
216 | |
217 | Create a large triangular grammar which looks like: | |
218 | ||
219 | input: | |
220 | exp { if ($1 != 0) abort (); $$ = $1; } | |
221 | | input exp { if ($2 != $1 + 1) abort (); $$ = $2; } | |
222 | ; | |
223 | ||
224 | exp: | |
225 | END { $$ = 0; } | |
226 | | "1" END { $$ = 1; } | |
227 | | "1" "2" END { $$ = 2; } | |
228 | | "1" "2" "3" END { $$ = 3; } | |
229 | | "1" "2" "3" "4" END { $$ = 4; } | |
230 | | "1" "2" "3" "4" "5" END { $$ = 5; } | |
231 | ; | |
232 | ||
7e5f9c54 | 233 | C<$base> is the base name for the file to create (F<$base.y>). |
15129f25 | 234 | C<$max> is the number of such rules (here, 5). You may pass |
5b421a4e | 235 | additional Bison C<@directive>. |
15129f25 AD |
236 | |
237 | The created parser is self contained: it includes its scanner, and | |
238 | source of input. | |
239 | =cut | |
240 | ||
# Write the self-contained grammar file "$base.y".
#
#   $base       base name of the file to create
#   $max        number of tokens t1 .. t$max, and of "exp" rules
#               beyond the bare END one
#   @directive  extra Bison directives, formatted by directives ()
#
# The embedded scanner returns END, then 1 END, then 1 2 END, and so
# on up to 1 .. $max END, and finally 0 (end of input).
# Dies, naming the file and the system error, if the file cannot be
# created or completely written.
sub generate_grammar_triangular ($$@)
{
  use Text::Wrap;

  my ($base, $max, @directive) = @_;
  my $directives = directives ($base, @directive);

  # Passing the mode separately keeps the file name from being parsed
  # for mode characters.
  my $out = IO::File->new ("$base.y", 'w')
    or die "cannot create $base.y: $!\n";

  # Prologue and declarations.
  print $out <<EOF;
%error-verbose
%{
#include <stdio.h>
#include <stdlib.h>

static int yylex (void);
static void yyerror (const char *msg);
%}
$directives
%union
{
  int val;
};

%token END "end"
%type <val> exp input
EOF

  # One token per size; its number is the value yylex returns for it.
  for my $size (1 .. $max)
    {
      print $out "%token t$size $size \"$size\"\n";
    }

  print $out <<EOF;
%%
input:
  exp { if (\$1 != 0) abort (); \$\$ = \$1; }
| input exp { if (\$2 != \$1 + 1) abort (); \$\$ = \$2; }
;

exp:
  END
    { \$\$ = 0; }
EOF

  # The triangle: rule number $size is "1" "2" ... "$size" END.  Long
  # right-hand sides are folded by Text::Wrap.
  for my $size (1 .. $max)
    {
      my @symbol = map { "\"$_\"" } (1 .. $size);
      print $out wrap ("| ", " ", @symbol, " END \n"),
                 " { \$\$ = $size; }\n";
    }
  print $out ";\n";

  # Epilogue: scanner, error reporting, and main.
  print $out <<EOF;
%%
static int
yylex (void)
{
  static int inner = 1;
  static int outer = 0;
  if (outer > $max)
    return 0;
  else if (inner > outer)
    {
      inner = 1;
      ++outer;
      return END;
    }
  return inner++;
}

static void
yyerror (const char *msg)
{
  fprintf (stderr, "%s\\n", msg);
}

int
main (void)
{
#if YYDEBUG
  yydebug = !!getenv ("YYDEBUG");
#endif
  return yyparse ();
}
EOF

  # Buffered write errors only show up when the handle is closed.
  $out->close
    or die "cannot write $base.y: $!\n";
}
328 | ||
329 | ################################################################## | |
330 | ||
15129f25 AD |
331 | =item C<calc_input ($base, $max)> |
332 | ||
7e5f9c54 | 333 | Generate the input file F<$base.input> for the calc parser. The input |
15129f25 AD |
334 | is composed of two expressions. The first one is using left recursion |
335 | only and consumes no stack. The second one requires a deep stack. | |
336 | These two expressions are repeated C<$max> times in the output file. | |
337 | ||
338 | =cut | |
339 | ||
3cedc2dc AD |
# Write "$base.input", the input of the calc parser: $max copies of
# a pair of lines.
#
#   $base  base name of the file to create
#   $max   number of times the pair of expressions is written
#
# The first expression, "0+1+...+99", is a flat sum.  The second one,
# "1+1*(2+2*(...(1000+1000*(1001)...))", nests 1000 parentheses.
# Dies, naming the file and the system error, if the file cannot be
# created or completely written.
sub calc_input ($$)
{
  my ($base, $max) = @_;

  # Both expressions are loop invariants: build them once, instead of
  # spelling them out as literals.
  my $flat = join ('+', 0 .. 99);

  my $depth = 1000;
  my $nested = join ('', map { "${_}+${_}*(" } 1 .. $depth)
    . ($depth + 1)
    . ')' x $depth;

  # Passing the mode separately keeps the file name from being parsed
  # for mode characters.
  my $out = IO::File->new ("$base.input", 'w')
    or die "cannot create $base.input: $!\n";
  for (1 .. $max)
    {
      print $out "$flat\n";
      print $out "$nested\n";
    }

  # Buffered write errors only show up when the handle is closed.
  $out->close
    or die "cannot write $base.input: $!\n";
}
351 | ||
352 | ################################################################## | |
3a2803df AD |
353 | |
354 | =item C<generate_grammar_calc ($base, $max, @directive)> | |
15129f25 | 355 | |
7e5f9c54 | 356 | Generate a Bison file F<$base.y> for a calculator parser in C. Pass |
5b421a4e | 357 | the additional Bison C<@directive>. C<$max> is ignored, but left to |
7109a18d | 358 | have the same interface as C<generate_grammar_triangular>. |
15129f25 AD |
359 | |
360 | =cut | |
3cedc2dc | 361 | |
# Write "$base.y", a calculator grammar in C, and (re)generate its
# input file "calc.input".
#
#   $base       base name of the grammar file to create
#   $max        unused; kept so that all the generators share the same
#               interface
#   @directive  extra Bison directives, formatted by directives ()
#
# The generated parser reads "calc.input" from the current directory.
# Dies, naming the file and the system error, if the grammar file
# cannot be created or completely written.
sub generate_grammar_calc ($$@)
{
  my ($base, $max, @directive) = @_;
  my $directives = directives ($base, @directive);

  # This is wasteful: the input is regenerated each time a grammar is
  # generated.  The name must remain 'calc', since the generated main
  # opens "calc.input".
  calc_input ('calc', 200);

  # Passing the mode separately keeps the file name from being parsed
  # for mode characters.
  my $out = IO::File->new ("$base.y", 'w')
    or die "cannot create $base.y: $!\n";

  # The heredoc interpolates: '$' and '\' meant for Bison or C are
  # escaped, while '\t' deliberately becomes a literal tab character.
  print $out <<EOF;
%{
#include <assert.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#define USE(Var)

/* Exercise pre-prologue dependency to %union. */
typedef int semantic_value;

static semantic_value global_result = 0;
static int global_count = 0;
%}

$directives
%error-verbose
/* Exercise %union. */
%union
{
  semantic_value ival;
};

%{
static int power (int base, int exponent);
/* yyerror receives the location if:
   - %location & %pure & %glr
   - %location & %pure & %yacc & %parse-param. */
static void yyerror (const char *s);
#if YYPURE
static int yylex (YYSTYPE* yylvalp);
#else
static int yylex (void);
#endif
%}

/* Bison Declarations */
%token CALC_EOF 0 "end of input"
%token <ival> NUM "number"
%type <ival> exp

%nonassoc '=' /* comparison */
%left '-' '+'
%left '*' '/'
%left NEG /* negation--unary minus */
%right '^' /* exponentiation */

/* Grammar follows */
%%
input:
  line
| input line
;

line:
  '\\n'
| exp '\\n' { USE (\$1); }
;

exp:
  NUM { \$\$ = \$1; }
| exp '=' exp
  {
    if (\$1 != \$3)
      fprintf (stderr, "calc: error: %d != %d\\n", \$1, \$3);
    \$\$ = \$1;
  }
| exp '+' exp { \$\$ = \$1 + \$3; }
| exp '-' exp { \$\$ = \$1 - \$3; }
| exp '*' exp { \$\$ = \$1 * \$3; }
| exp '/' exp { \$\$ = \$1 / \$3; }
| '-' exp %prec NEG { \$\$ = -\$2; }
| exp '^' exp { \$\$ = power (\$1, \$3); }
| '(' exp ')' { \$\$ = \$2; }
| '(' error ')' { \$\$ = 1111; }
| '!' { \$\$ = 0; YYERROR; }
| '-' error { \$\$ = 0; YYERROR; }
;
%%
/* The input. */
static FILE *input;

static void
yyerror (const char *s)
{
  fprintf (stderr, "%s\\n", s);
}

static int
get_char (void)
{
  return getc (input);
}


static void
unget_char ( int c)
{
  ungetc (c, input);
}

static int
read_signed_integer (void)
{
  int c = get_char ();
  int sign = 1;
  int n = 0;

  if (c == '-')
    {
      c = get_char ();
      sign = -1;
    }

  while (isdigit (c))
    {
      n = 10 * n + (c - '0');
      c = get_char ();
    }

  unget_char (c);

  return sign * n;
}

static int
#if YYPURE
# define yylval (*yylvalp)
yylex (YYSTYPE* yylvalp)
#else
yylex (void)
#endif
{
  int c;

  /* Skip white space. */
  while ((c = get_char ()) == ' ' || c == '\t')
    continue;

  /* process numbers */
  if (c == '.' || isdigit (c))
    {
      unget_char ( c);
      yylval.ival = read_signed_integer ();
      return NUM;
    }

  /* Return end-of-file. */
  if (c == EOF)
    return CALC_EOF;

  /* Return single chars. */
  return c;
}

static int
power (int base, int exponent)
{
  assert (0 <= exponent);
  int res = 1;
  for (/* Niente */; exponent; --exponent)
    res *= base;
  return res;
}


int
main (int argc, const char **argv)
{
  semantic_value result = 0;
  int count = 0;
  int status;

#if YYDEBUG
  yydebug = !!getenv ("YYDEBUG");
#endif

  input = fopen ("calc.input", "r");
  if (!input)
    {
      perror ("calc.input");
      return 3;
    }

  status = yyparse ();
  if (global_result != result)
    abort ();
  if (global_count != count)
    abort ();

  return status;
}
EOF

  # Buffered write errors only show up when the handle is closed.
  $out->close
    or die "cannot write $base.y: $!\n";
}
568 | ||
569 | ################################################################## | |
570 | ||
f10e19fd | 571 | =item C<generate_grammar_list ($base, $max, @directive)> |
7109a18d | 572 | |
f10e19fd AD |
573 | Generate a Bison file F<$base.y> for a C++ parser that uses C++ |
574 | objects (std::string, std::list). Tailored for using %define variant. | |
7109a18d AD |
575 | |
576 | =cut | |
577 | ||
# Write "$base.y", a C++ grammar whose semantic values are strings
# and integers.
#
#   $base       base name of the file to create
#   $max        the generated scanner produces $max * 10 tokens
#               before reporting the end of input
#   @directive  extra Bison directives, formatted by directives ()
#
# Two directives are also detected here, because the generated code
# depends on them: "%define variant" selects the variant-based rules
# instead of the %union-based ones, and "%define api.token.constructor"
# selects the yylex signature.
# Dies, naming the file and the system error, if the file cannot be
# created or completely written.
sub generate_grammar_list ($$@)
{
  my ($base, $max, @directive) = @_;
  my $directives = directives ($base, @directive);

  # In scalar context grep counts the matches; the counts are emitted
  # as the values of the USE_VARIANTS/USE_TOKEN_CTOR macros below.
  my $variant = grep { /%define "?variant"?/ } @directive;
  # The dots are escaped so that they match only themselves.
  my $token_ctor
    = grep { /%define "?api\.token\.constructor"?/ } @directive;

  # Passing the mode separately keeps the file name from being parsed
  # for mode characters.
  my $out = IO::File->new ("$base.y", 'w')
    or die "cannot create $base.y: $!\n";

  # Interpolating heredoc: $directives, $max, $token_ctor and $variant
  # are expanded.  <cstdlib> is included because the epilogue calls
  # abort and getenv.
  print $out <<EOF;
%language "C++"
%defines
%locations
$directives

%code requires // *.h
{
#include <string>
}

%code // *.c
{
#include <algorithm>
#include <cstdlib>
#include <iostream>
#include <sstream>

#define STAGE_MAX ($max * 10) // max = $max

#define USE_TOKEN_CTOR $token_ctor
#define USE_VARIANTS $variant

  // Prototype of the yylex function providing subsequent tokens.
  static
#if USE_TOKEN_CTOR
  yy::parser::symbol_type yylex();
#else
  yy::parser::token_type yylex(yy::parser::semantic_type* yylvalp,
                               yy::parser::location_type* yyllocp);
#endif

  // Conversion to string.
  template <typename T>
    inline
    std::string
    string_cast (const T& t)
  {
    std::ostringstream o;
    o << t;
    return o.str ();
  }
}

%token END_OF_FILE 0
EOF

  # From here on the heredocs do not interpolate: '$$' and '$1' are
  # meant for Bison.
  if ($variant)
    {
      print $out <<'EOF';
%token <std::string> TEXT
%token <int> NUMBER
%printer { std::cerr << "Number: " << $$; } <int>
%printer { std::cerr << "Text: " << $$; } <std::string>
%type <std::string> text result

%%
result:
  text { /* Throw away the result. */ }
;

text:
  /* nothing */ { /* This will generate an empty string */ }
| text TEXT { std::swap ($$, $2); }
| text NUMBER { $$ = string_cast($2); }
;
EOF
    }
  else
    {
      # Not using Bison variants.
      print $out <<'EOF';
%union {int ival; std::string* sval;}
%token <sval> TEXT
%token <ival> NUMBER
%printer { std::cerr << "Number: " << $$; } <ival>
%printer { std::cerr << "Text: " << *$$; } <sval>
%type <sval> text result

%%
result:
  text { delete $1; }
;

text:
  /* nothing */ { $$ = new std::string; }
| text TEXT { delete $1; $$ = $2; }
| text NUMBER { delete $1; $$ = new std::string (string_cast ($2)); }
;
EOF
    }

  # Epilogue: the scanner alternates TEXT (even stages) and NUMBER
  # (odd stages) until STAGE_MAX is reached.
  print $out <<'EOF';
%%
#

static
#if USE_TOKEN_CTOR
yy::parser::symbol_type yylex()
#else
yy::parser::token_type yylex(yy::parser::semantic_type* yylvalp,
                             yy::parser::location_type* yyllocp)
#endif
{
  typedef yy::parser::location_type location_type;
  typedef yy::parser::token token;
  static int stage = -1;
  ++stage;
  if (stage == STAGE_MAX)
    {
#if USE_TOKEN_CTOR
      return yy::parser::make_END_OF_FILE (location_type ());
#else
      *yyllocp = location_type ();
      return token::END_OF_FILE;
#endif
    }
  else if (stage % 2)
    {
#if USE_TOKEN_CTOR
      return yy::parser::make_NUMBER (stage, location_type ());
#else
# if defined ONE_STAGE_BUILD
      yylvalp->build(stage);
# elif USE_VARIANTS
      yylvalp->build<int>() = stage;
# else
      yylvalp->ival = stage;
# endif
      *yyllocp = location_type ();
      return token::NUMBER;
#endif
    }
  else
    {
#if USE_TOKEN_CTOR
      return yy::parser::make_TEXT ("A string.", location_type ());
#else
# if defined ONE_STAGE_BUILD
      yylvalp->build(std::string("A string."));
# elif USE_VARIANTS
      yylvalp->build<std::string>() = std::string("A string.");
# else
      yylvalp->sval = new std::string("A string.");
# endif
      *yyllocp = location_type ();
      return token::TEXT;
#endif
    }
  abort();
}

// Mandatory error function
void
yy::parser::error(const yy::parser::location_type& loc, const std::string& msg)
{
  std::cerr << loc << ": " << msg << std::endl;
}

int main(int argc, char *argv[])
{
  yy::parser p;
#if YYDEBUG
  p.set_debug_level(!!getenv("YYDEBUG"));
#endif
  p.parse();
  return 0;
}
EOF

  # Buffered write errors only show up when the handle is closed.
  $out->close
    or die "cannot write $base.y: $!\n";
}
755 | ||
756 | ################################################################## | |
757 | ||
3a2803df AD |
=item C<generate_grammar ($name, $base, @directive)>

Generate F<$base.y> by calling C<&generate_grammar_$name>.  C<$name>
must be one of C<calc>, C<list> or C<triangular>; anything else is a
fatal error.  The generator receives C<$base>, the constant 200 and
C<@directive>.

=cut

sub generate_grammar ($$@)
{
  my ($name, $base, @directive) = @_;
  verbose (3, "Generating $base.y\n");
  my %generator =
    (
      "calc"       => \&generate_grammar_calc,
      "list"       => \&generate_grammar_list,
      "triangular" => \&generate_grammar_triangular,
    );
  # $name may come straight from --grammar: diagnose a typo here rather
  # than failing on an undefined code reference.
  die "invalid grammar: $name (expected one of: "
      . join (', ', sort keys %generator) . ")\n"
    unless exists $generator{$name};
  $generator{$name}->($base, 200, @directive);
}
776 | ||
777 | ################################################################## | |
778 | ||
=item C<run ($command)>

Run, possibly verbosely, the shell C<$command>.  Return 1 on success.
Die when the command cannot be started, is killed by a signal, or
exits with a non-zero status; the message says which.

=cut

sub run ($)
{
  my ($command) = @_;
  verbose (3, "$command\n");
  my $status = system ($command);
  return 1
    if $status == 0;

  # Decode the wait status the way perlfunc documents it for system:
  # -1 means the command could not be run at all (reason in $!), the
  # low 7 bits hold a signal number, the high byte the exit status.
  my $why = $status == -1 ? "cannot execute: $!"
          : $status & 127 ? sprintf ("killed by signal %d", $status & 127)
          :                 sprintf ("exit status %d", $status >> 8);
  die "$command failed ($why)";
}
792 | ||
793 | ################################################################## | |
794 | ||
15129f25 AD |
=item C<compile ($base)>

Turn the grammar F<$base.y> into the executable F<$base>: run bison
to produce F<$base.c>, then compile that file with C<$cflags>.  The
C++ compiler (C<$cxx>) is used when F<$base.y> declares
C<%language "C++">, the C compiler (C<$cc>) otherwise.  A
C<%bison "PATH"> line in F<$base.y> replaces C<$bison> for this bench.

=cut

sub compile ($)
{
  my ($base) = @_;

  # The first %language "..." line of the grammar selects the compiler.
  my $language = `sed -ne '/%language "\\(.*\\)"/{s//\\1/;p;q;}' $base.y`;
  chomp $language;
  my $compiler = $cc;
  $compiler = $cxx
    if $language eq 'C++';

  # The first %bison "..." line, if any, names the bison to run.  Its
  # text is used exactly as sed printed it, i.e. NOT chomped.
  # NOTE(review): the %b directive emits a backslash right after the
  # closing quote, so this presumably ends in backslash-newline, which
  # the shell reads as a line continuation -- confirm before chomping.
  my $my_bison = `sed -ne '/%bison "\\(.*\\)"/{s//\\1/;p;q;}' $base.y`;
  my $generator = $bison;
  $generator = $my_bison
    if length $my_bison;

  run ("$generator $base.y -o $base.c");
  run ("$compiler -o $base $cflags $base.c");
}
814 | ||
3a2803df AD |
815 | ###################################################################### |
816 | ||
=item C<bench ($grammar, @token)>

Generate benches for the C<$grammar> and the directive specification
given in the list of C<@token>.

C<@token> is handed to C<parse>; each resulting set of directives is
numbered from 1 and listed on standard output.  For each number N, in
increasing order, F<N.y> is generated and compiled into the executable
F<N>.  The executables are then passed to Benchmark's C<timethese>
with C<$iterations>, compared with C<cmpthese>, and finally listed by
decreasing size.

=cut

sub bench ($@)
{
  my ($grammar, @token) = @_;
  use Benchmark qw (:all :hireswallclock);

  my @directive = parse (@token);

  # List the sets of directives, numbered from 1.
  my $count = 0;
  for my $d (@directive)
    {
      printf " %2d. %s\n", ++$count, join (' ', split ("\n", $d));
    }

  # Set up the benches as expected by timethese: bench name => code.
  my %bench;
  # For each bench, capture the size of its executable, in bytes.
  my %size;

  # Build in numeric order so that the (verbose) output is reproducible.
  for my $name (1 .. @directive)
    {
      generate_grammar ($grammar, $name, $directive[$name - 1]);
      # Compile the executable.
      compile ($name);
      $bench{$name} = "system ('./$name');";
      # -s is false for a missing or empty file: count that as 0 bytes.
      $size{$name} = (-s $name) || 0;
    }

  # Run the benches.
  #
  # STYLE can be any of 'all', 'none', 'noc', 'nop' or 'auto'.  'all'
  # shows each of the 5 times available ('wallclock' time, user time,
  # system time, user time of children, and system time of
  # children).  'noc' shows all except the two children times.  'nop'
  # shows only wallclock and the two children times.  'auto' (the
  # default) will act as 'all' unless the children times are both
  # zero, in which case it acts as 'noc'.  'none' prevents output.
  verbose (3, "Running the benches for $grammar\n");
  my $res = timethese ($iterations, \%bench, 'nop');

  # Output the speed result.
  cmpthese ($res, 'nop');

  # Display the sizes.
  print "Sizes (decreasing):\n";
  # The name column is at least 10 characters wide.
  my $width = 10;
  for my $bench (keys %size)
    {
      $width = length $bench
        if $width < length $bench;
    }
  # Benches sorted by decreasing size.
  my @benches_per_size = sort {$size{$b} <=> $size{$a}} keys %size;
  for my $bench (@benches_per_size)
    {
      printf "%${width}s: %5.2fkB\n", $bench, $size{$bench} / 1024;
    }
}
884 | ||
3a2803df | 885 | ###################################################################### |
7484f1d4 AD |
886 | |
=item C<bench_push_parser ()>

Bench the C push parser against the pull parser, pure and impure
interfaces: the C<calc> grammar is benched with every combination of
an optional C<%define api.pure> and an optional
C<%define api.push-pull "both">.

=cut

sub bench_push_parser ()
{
  # [ %d api.pure ] & [ %d api.push-pull=both ]
  my @spec = ('[', '%d', 'api.pure', ']',
              '&',
              '[', '%d', 'api.push-pull=both', ']');
  bench ('calc', @spec);
}
903 | ||
3a2803df AD |
904 | ###################################################################### |
905 | ||
7109a18d AD |
=item C<bench_variant_parser ()>

Bench the C++ lalr1.cc parser using variants or %union.

The C<list> grammar is benched with four sets of directives:
C<%define variant> together with C<#define ONE_STAGE_BUILD>,
C<%define variant> together with C<%define api.token.constructor>,
C<%define variant> alone, and no directive at all.

=cut

sub bench_variant_parser ()
{
  # [ %d variant & [ #d ONE_STAGE_BUILD | %d api.token.constructor ] ]
  #
  # Spelled as a plain list rather than qw(): a '#' inside qw() makes
  # perl -w warn about a possible attempt to put comments in the list.
  my @spec = ('[',
                '%d', 'variant',
                '&',
                '[',
                  '#d', 'ONE_STAGE_BUILD',
                  '|',
                  '%d', 'api.token.constructor',
                ']',
              ']');
  bench ('list', @spec);
}
923 | } |
924 | ||
925 | ############################################################################ | |
926 | ||
7e5f9c54 AD |
# help ($VERBOSE)
# ---------------
# Display this script's POD on standard output through pod2usage,
# at verbosity level $VERBOSE, with an exit value of 0.
sub help ($)
{
  my ($level) = @_;
  use Pod::Usage;
  # See <URL:http://perldoc.perl.org/pod2man.html#NOTES>.
  my %usage =
    (
      -message => "Bench Bison parsers",
      -exitval => 0,
      -verbose => $level,
      -output  => \*STDOUT,
    );
  pod2usage (\%usage);
}
937 | ||
3a2803df AD |
938 | ###################################################################### |
939 | ||
fce629c0 AD |
# The end of the directives to parse.
my $eod = "end of directives";
# The list of tokens parsed by the following functions.
my @token;

# eat ($EXPECTED)
# ---------------
# Check that the current token is $EXPECTED, and move to the next.
# Return the token that was consumed.  Die, showing the remaining
# tokens, on a mismatch; die as well when no token is left at all.
sub eat ($)
{
  my ($expected) = @_;
  # Without this check, an empty @token would compare undef below and
  # yield warnings plus a message with nothing after "unexpected:".
  die "expected $expected, unexpected end of input\n"
    unless @token;
  die "expected $expected, unexpected: $token[0] (@token)\n"
    unless $token[0] eq $expected;
  shift @token;
}
955 | ||
f10e19fd AD |
# parse (@TOKEN)
# --------------
# Parse directive specifications:
#   expr: term (| term)*
#   term: fact (& fact)*
#   fact: ( expr ) | [ expr ] | dirs
#   dirs: %b PATH | %s SKELETON | #d NAME[=VALUE] | %d NAME[=VALUE]
#       | directive
#
# Load @TOKEN, followed by the end marker, into the shared token list,
# parse one expr, require that nothing but the end marker is left, and
# return what parse_expr returned.
sub parse (@)
{
  @token = @_;
  push @token, $eod;
  verbose (3, "Parsing: @token\n");
  my @directive_sets = parse_expr ();
  eat ($eod);
  return @directive_sets;
}
969 | ||
# parse_expr ()
# -------------
# expr: term (| term)*
# Return the results of all the terms, one after the other.
sub parse_expr ()
{
  my @alternatives = parse_term ();
  while (1)
    {
      last
        unless $token[0] eq '|';
      eat ('|');
      # Alternation: simply append what the next term yields.
      push @alternatives, parse_term ();
    }
  return @alternatives;
}
981 | ||
# parse_term ()
# -------------
# term: fact (& fact)*
# Return the Cartesian product of the facts: every result so far is
# concatenated with every result of the next fact, separated by a
# newline when both sides are true (in the Perl sense).
sub parse_term ()
{
  my @product = parse_fact ();
  while ($token[0] eq '&')
    {
      eat ('&');
      my @left = @product;
      # The right-hand side varies slowest: for each of its results,
      # walk through all the left-hand sides.
      @product = map
        {
          my $right = $_;
          map
            {
              my $l = $_;
              $l . ($l && $right ? "\n" : "") . $right;
            }
            @left;
        }
        parse_fact ();
    }
  return @product;
}
1001 | ||
# parse_fact ()
# -------------
# fact: ( expr ) | [ expr ] | dirs
# Parentheses only group.  Brackets make their contents optional: the
# empty string is added after the results of the enclosed expr.
sub parse_fact ()
{
  die "unexpected end of expression"
    unless defined $token[0];

  # Opening token => matching closing token.
  my %closer = ('(' => ')', '[' => ']');
  my $opener = $token[0];

  # Not a group: it must be a directive.
  return parse_dirs ()
    unless exists $closer{$opener};

  eat ($opener);
  my @sets = parse_expr ();
  push @sets, ''
    if $opener eq '[';
  eat ($closer{$opener});
  return @sets;
}
1026 | ||
# parse_dirs ()
# -------------
# dirs: %b PATH | %s SKELETON | #d NAME[=VALUE] | %d NAME[=VALUE]
#     | directive
#
# Consume one directive from the token list and return the
# corresponding text for the grammar file, as a one-element list:
#   #d NAME[=VALUE]  =>  %code { #define NAME [VALUE] }
#   %d NAME[=VALUE]  =>  %define NAME ["VALUE"]
#   %s SKELETON      =>  %skeleton "SKELETON"
#   %b PATH          =>  a comment holding %bison "PATH"
#   anything else    =>  itself, verbatim
#
# Die when there is no directive to read (end of the tokens, or an
# operator where a directive is expected), or when one of the keywords
# above is not followed by its argument.
sub parse_dirs ()
{
  die "unexpected end of expression"
    if !defined $token[0] || $token[0] eq $eod;

  # Operators and closers cannot be directives.  Without this check
  # they are swallowed here and the error surfaces later, elsewhere.
  my %operator = map { $_ => 1 } (')', ']', '|', '&');
  die "unexpected $token[0] (@token)\n"
    if $operator{$token[0]};

  my $keyword = shift @token;

  # Anything but a known keyword is a directive to use verbatim.
  my %takes_argument = map { $_ => 1 } ('#d', '%d', '%s', '%b');
  return ($keyword)
    unless $takes_argument{$keyword};

  # Do not let a keyword take the end marker as its argument.
  die "missing argument for $keyword\n"
    if !defined $token[0] || $token[0] eq $eod;
  my $arg = shift @token;

  if ($keyword eq '#d')
    {
      $arg =~ s/(.*?)=(.*)/$1 $2/;
      return ("%code {\n#define $arg\n}");
    }
  elsif ($keyword eq '%d')
    {
      $arg =~ s/(.*?)=(.*)/$1 "$2"/;
      return ("%define $arg");
    }
  elsif ($keyword eq '%s')
    {
      return ("%skeleton \"$arg\"");
    }
  else
    {
      # %b.  The text is hidden in a comment of the grammar file; the
      # backslash after the closing quote is part of the emitted text.
      return ("/*\n%bison \"$arg\"\\\n*/");
    }
}
1067 | ||
1068 | ###################################################################### | |
1069 | ||
7e5f9c54 AD |
# getopt ()
# ---------
# Process the command line options with Getopt::Long, configured with
# "bundling" and "pass_through", storing the values in the file-level
# option variables.  Exit with status 1 if GetOptions reports a failure.
sub getopt ()
{
  use Getopt::Long;
  Getopt::Long::Configure ("bundling", "pass_through");
  GetOptions
    (
      "b|bench=s"      => \$bench,
      "c|cflags=s"     => \$cflags,
      "d|directive=s"  => \@directive,
      "g|grammar=s"    => \$grammar,
      "h|help"         => sub { help ($verbose) },
      "i|iterations=i" => \$iterations,
      # -q and -v move the verbosity level one step down or up.
      "q|quiet"        => sub { --$verbose },
      "v|verbose"      => sub { ++$verbose },
    )
    or exit 1;
}
1087 | ||
1088 | ###################################################################### | |
1089 | ||
getopt ();

# Create the directory we work in: benches/N, where N is the smallest
# positive integer for which benches/N does not exist yet.  Any
# existing entry is skipped, not only directories, so that a stray
# file by that name does not make mkdir fail.
unless (-d "benches")
  {
    mkdir "benches"
      or die "cannot create benches: $!";
  }
my $count = 1;
++$count
  while -e "benches/$count";
my $dir = "benches/$count";
mkdir $dir
  or die "cannot create $dir: $!";
chdir $dir
  or die "cannot chdir $dir: $!";

# The following message is tailored to please Emacs' compilation-mode.
verbose (1, "Entering directory `$dir'\n");
verbose (1, "Using bison=$bison.\n");
verbose (2, "Using cc=$cc.\n");
verbose (2, "Using cxx=$cxx.\n");
verbose (2, "Using cflags=$cflags.\n");
verbose (2, "Grammar: $grammar\n");
1111 | ||
a6df593d | 1112 | |
c85be41a AD |
# Support -b: predefined benches, by name.
my %bench =
  (
    "push"    => \&bench_push_parser,
    "variant" => \&bench_variant_parser,
  );

if (!defined $bench)
  {
    # No -b: launch the bench marking of $grammar with the directives
    # given on the command line.
    bench ($grammar, @ARGV);
  }
else
  {
    my $predefined = $bench{$bench};
    die "invalid argument for --bench: $bench"
      unless defined $predefined;
    $predefined->();
    exit 0;
  }
3cedc2dc AD |
1132 | |
1133 | ### Setup "GNU" style for perl-mode and cperl-mode. | |
1134 | ## Local Variables: | |
1135 | ## perl-indent-level: 2 | |
1136 | ## perl-continued-statement-offset: 2 | |
1137 | ## perl-continued-brace-offset: 0 | |
1138 | ## perl-brace-offset: 0 | |
1139 | ## perl-brace-imaginary-offset: 0 | |
1140 | ## perl-label-offset: -2 | |
1141 | ## cperl-indent-level: 2 | |
1142 | ## cperl-brace-offset: 0 | |
1143 | ## cperl-continued-brace-offset: 0 | |
1144 | ## cperl-label-offset: -2 | |
1145 | ## cperl-extra-newline-before-brace: t | |
1146 | ## cperl-merge-trailing-else: nil | |
1147 | ## cperl-continued-statement-offset: 2 | |
1148 | ## End: |