~ubuntu-branches/ubuntu/trusty/happy/trusty-proposed

Viewing changes to src/LALR.lhs

Committer: Bazaar Package Importer
Author(s): Ian Lynagh (wibble)
Date: 2006-10-26 22:52:14 UTC
mfrom: (1.2.2 upstream) (3.1.1 dapper)
Revision ID: james.westby@ubuntu.com-20061026225214-6jmf0n3ykkc9elyw

Tags: 1.16~rc2-1

http://bugs.debian.org/340325

http://bugs.debian.org/332979

* New upstream (release candidate) version.
* Removed happy/ prefixes from various paths in debian/rules and
  debian/docs.
* doc/configure generated by autoconf is in the Debian diff.
* Build using cabal:
  * Various debian/rules changes.
  * Create debian/get_version.hs for extracting the version from the cabal
    file.
  * Requires ghc6 >= 6.4.2.
  * No longer tries to detect platform. Closes: #340325, #332979.
  * Removed autotool-dev build-dep.
* Add 'XSLTPROC_OPTS = --nonet' to doc/config.mk.in.
* Remove src/Parser.ly and src/AttrGrammarParser.ly before cleaning so
  the generated files don't get cleaned.
* Set Standards-Version to 3.7.2 (no changes needed).
* Removed PS and DVI stanzas from debian/doc-base as we don't build
  the documentation those ways.
* Removed content-free postinst and prerm.

files added:
ANNOUNCE

CHANGES

InstallShield

InstallShield/Component Definitions

InstallShield/Component Definitions/Default.cdf

InstallShield/Component Definitions/Default.fgl

InstallShield/File Groups

InstallShield/File Groups/Default.fdf

InstallShield/File Groups/Help Files.fgl

InstallShield/File Groups/Program Executable Files.fgl

InstallShield/Happy.ipr

InstallShield/Registry Entries

InstallShield/Registry Entries/Default.rge

InstallShield/Script Files

InstallShield/Script Files/Setup.Inx

InstallShield/Script Files/Setup.Obs

InstallShield/Script Files/Setup.dbg

InstallShield/Script Files/Setup.ino

InstallShield/Script Files/Setup.ins

InstallShield/Script Files/Setup.map

InstallShield/Script Files/setup.rul

InstallShield/Setup Files

InstallShield/Setup Files/Compressed Files

InstallShield/Setup Files/Compressed Files/Language Independent

InstallShield/Setup Files/Compressed Files/Language Independent/OS Independent

InstallShield/Setup Files/Compressed Files/Language Independent/OS Independent/ANNOUNCE

InstallShield/Setup Files/Uncompressed Files

InstallShield/Setup Files/Uncompressed Files/Language Independent

InstallShield/Setup Files/Uncompressed Files/Language Independent/OS Independent

InstallShield/Setup Files/Uncompressed Files/Language Independent/OS Independent/setup.bmp

InstallShield/Shell Objects

InstallShield/Shell Objects/Default.shl

InstallShield/String Tables

InstallShield/String Tables/0009-English

InstallShield/String Tables/0009-English/value.shl

InstallShield/String Tables/Default.shl

InstallShield/Text Substitutions

InstallShield/Text Substitutions/Build.tsb

InstallShield/Text Substitutions/Setup.tsb

LICENSE

Setup.lhs

TODO

debian/get_version.hs

doc/Makefile

doc/aclocal.m4

doc/config.mk.in

doc/configure

doc/configure.ac

doc/docbook-xml.mk

doc/fptools.css

doc/happy.1.in

doc/happy.xml

examples

examples/Calc.ly

examples/DavesExample.ly

examples/ErlParser.ly

examples/ErrorTest.ly

examples/LexerTest.ly

examples/MonadTest.ly

examples/PgnParser.ly

examples/README

examples/SimonsExample.ly

examples/glr

examples/glr/Makefile

examples/glr/Makefile.defs

examples/glr/bio-eg

examples/glr/bio-eg/1-1200.dna

examples/glr/bio-eg/1-600.dna

examples/glr/bio-eg/Bio.y

examples/glr/bio-eg/Main.lhs

examples/glr/bio-eg/Makefile

examples/glr/bio-eg/README

examples/glr/common

examples/glr/common/DV_lhs

examples/glr/common/DaVinciTypes.hs

examples/glr/expr-eval

examples/glr/expr-eval/Expr.y

examples/glr/expr-eval/Hugs.lhs

examples/glr/expr-eval/Main.lhs

examples/glr/expr-eval/Makefile

examples/glr/expr-eval/README

examples/glr/expr-monad

examples/glr/expr-monad/Expr.y

examples/glr/expr-monad/Hugs.lhs

examples/glr/expr-monad/Main.lhs

examples/glr/expr-monad/Makefile

examples/glr/expr-monad/README

examples/glr/expr-tree

examples/glr/expr-tree/Expr.y

examples/glr/expr-tree/Hugs.lhs

examples/glr/expr-tree/Main.lhs

examples/glr/expr-tree/Makefile

examples/glr/expr-tree/README

examples/glr/expr-tree/Tree.lhs

examples/glr/hidden-leftrec

examples/glr/hidden-leftrec/Expr.y

examples/glr/hidden-leftrec/Hugs.lhs

examples/glr/hidden-leftrec/Main.lhs

examples/glr/hidden-leftrec/Makefile

examples/glr/hidden-leftrec/README

examples/glr/highly-ambiguous

examples/glr/highly-ambiguous/Expr.y

examples/glr/highly-ambiguous/Hugs.lhs

examples/glr/highly-ambiguous/Main.lhs

examples/glr/highly-ambiguous/Makefile

examples/glr/highly-ambiguous/README

examples/glr/nlp

examples/glr/nlp/English.y

examples/glr/nlp/Hugs.lhs

examples/glr/nlp/Main.lhs

examples/glr/nlp/Makefile

examples/glr/nlp/README

examples/glr/packing

examples/glr/packing/Expr.y

examples/glr/packing/Hugs.lhs

examples/glr/packing/Main.lhs

examples/glr/packing/Makefile

examples/glr/packing/README

examples/igloo

examples/igloo/Foo.hs

examples/igloo/Lexer.hs

examples/igloo/Lexer.x

examples/igloo/Makefile

examples/igloo/Parser.hs

examples/igloo/Parser.y

examples/igloo/ParserM.hs

examples/igloo/README

happy.cabal

happy.spec

src/ARRAY-NOTES

src/AbsSyn.lhs

src/AttrGrammar.lhs

src/AttrGrammarParser.hs

src/AttrGrammarParser.ly

src/First.lhs

src/GenUtils.lhs

src/Grammar.lhs

src/Info.lhs

src/LALR.lhs

src/Lexer.lhs

src/Main.lhs

src/ParseMonad.lhs

src/Parser.hs

src/Parser.ly

src/ProduceCode.lhs

src/ProduceGLRCode.lhs

src/Set.hs

src/Target.lhs

templates

templates/GLR_Base.lhs

templates/GLR_Lib.lhs

templates/GenericTemplate.hs

tests

tests/Makefile

tests/Partial.ly

tests/Test.ly

tests/TestMulti.ly

tests/TestPrecedence.ly

tests/bogus-token.y

tests/bug001.ly

tests/bug002.y

tests/monad001.y

tests/monad002.ly

tests/precedence001.ly

tests/precedence002.y

files removed:
aclocal.m4

config.guess

config.sub

configure

configure.ac

debian/postinst

debian/prerm

distrib

distrib/INSTALL

distrib/Makefile-bin.in

distrib/configure-bin.ac

distrib/cross-port

distrib/cvs-build

distrib/fake-happy

distrib/hc-build

distrib/prep-bin-dist-mingw

distrib/prep-bin-dist-mingw-alex

distrib/prep-bin-dist-mingw-args

distrib/prep-bin-dist-mingw-greencard

distrib/prep-bin-dist-mingw-haddock

distrib/prep-bin-dist-mingw-happy

distrib/prep-bin-dist-mingw-hdirect

docs

docs/Makefile

docs/building

docs/building/Makefile

docs/building/building.xml

docs/coding-style.html

docs/docbook-cheat-sheet

docs/docbook-cheat-sheet/Makefile

docs/docbook-cheat-sheet/docbook-cheat-sheet.xml

docs/ffi-art

docs/hep

docs/hep/hep.tex

glafp-utils

glafp-utils/Makefile

glafp-utils/PATCHLEVEL

glafp-utils/README

glafp-utils/genargs

glafp-utils/genargs/Makefile

glafp-utils/genargs/genargs.pl

glafp-utils/lndir

glafp-utils/lndir/Makefile

glafp-utils/lndir/lndir-Xos.h

glafp-utils/lndir/lndir-Xosdefs.h

glafp-utils/lndir/lndir.c

glafp-utils/ltx

glafp-utils/ltx/Makefile

glafp-utils/ltx/ltx.prl

glafp-utils/mk

glafp-utils/mk/boilerplate.mk

glafp-utils/mk/target.mk

glafp-utils/mkdependC

glafp-utils/mkdependC/Makefile

glafp-utils/mkdependC/mkdependC.prl

glafp-utils/mkdirhier

glafp-utils/mkdirhier/Makefile

glafp-utils/mkdirhier/mkdirhier.sh

glafp-utils/nofib-analyse

glafp-utils/nofib-analyse/CmdLine.hs

glafp-utils/nofib-analyse/GenUtils.lhs

glafp-utils/nofib-analyse/Main.hs

glafp-utils/nofib-analyse/Makefile

glafp-utils/nofib-analyse/Printf.lhs

glafp-utils/nofib-analyse/Slurp.hs

glafp-utils/runstdtest

glafp-utils/runstdtest/Makefile

glafp-utils/runstdtest/runstdtest.prl

glafp-utils/sgmlverb

glafp-utils/sgmlverb/Makefile

glafp-utils/sgmlverb/sgmlverb.lex

glafp-utils/verbatim

glafp-utils/verbatim/Makefile

glafp-utils/verbatim/verbatim.lex

happy

happy/ANNOUNCE

happy/CHANGES

happy/InstallShield

happy/InstallShield/Component Definitions

happy/InstallShield/Component Definitions/Default.cdf

happy/InstallShield/Component Definitions/Default.fgl

happy/InstallShield/File Groups

happy/InstallShield/File Groups/Default.fdf

happy/InstallShield/File Groups/Help Files.fgl

happy/InstallShield/File Groups/Program Executable Files.fgl

happy/InstallShield/Happy.ipr

happy/InstallShield/Registry Entries

happy/InstallShield/Registry Entries/Default.rge

happy/InstallShield/Script Files

happy/InstallShield/Script Files/Setup.Inx

happy/InstallShield/Script Files/Setup.Obs

happy/InstallShield/Script Files/Setup.dbg

happy/InstallShield/Script Files/Setup.ino

happy/InstallShield/Script Files/Setup.ins

happy/InstallShield/Script Files/Setup.map

happy/InstallShield/Script Files/setup.rul

happy/InstallShield/Setup Files

happy/InstallShield/Setup Files/Compressed Files

happy/InstallShield/Setup Files/Compressed Files/Language Independent

happy/InstallShield/Setup Files/Compressed Files/Language Independent/OS Independent

happy/InstallShield/Setup Files/Compressed Files/Language Independent/OS Independent/ANNOUNCE

happy/InstallShield/Setup Files/Uncompressed Files

happy/InstallShield/Setup Files/Uncompressed Files/Language Independent

happy/InstallShield/Setup Files/Uncompressed Files/Language Independent/OS Independent

happy/InstallShield/Setup Files/Uncompressed Files/Language Independent/OS Independent/setup.bmp

happy/InstallShield/Shell Objects

happy/InstallShield/Shell Objects/Default.shl

happy/InstallShield/String Tables

happy/InstallShield/String Tables/0009-English

happy/InstallShield/String Tables/0009-English/value.shl

happy/InstallShield/String Tables/Default.shl

happy/InstallShield/Text Substitutions

happy/InstallShield/Text Substitutions/Build.tsb

happy/InstallShield/Text Substitutions/Setup.tsb

happy/LICENSE

happy/Makefile

happy/README

happy/TODO

happy/doc

happy/doc/Makefile

happy/doc/happy-1.15-html.tar.gz

happy/doc/happy.1.in

happy/doc/happy.xml

happy/doc/index.html

happy/examples

happy/examples/Calc.ly

happy/examples/DavesExample.ly

happy/examples/ErlParser.ly

happy/examples/ErrorTest.ly

happy/examples/LexerTest.ly

happy/examples/MonadTest.ly

happy/examples/PgnParser.ly

happy/examples/README

happy/examples/SimonsExample.ly

happy/examples/igloo

happy/examples/igloo/Foo.hs

happy/examples/igloo/Lexer.hs

happy/examples/igloo/Lexer.x

happy/examples/igloo/Makefile

happy/examples/igloo/Parser.hs

happy/examples/igloo/Parser.y

happy/examples/igloo/ParserM.hs

happy/examples/igloo/README

happy/happy.spec

happy/mk

happy/mk/boilerplate.mk

happy/mk/config.mk

happy/mk/target.mk

happy/mk/version.mk

happy/src

happy/src/ARRAY-NOTES

happy/src/AbsSyn.lhs

happy/src/First.lhs

happy/src/GenUtils.lhs

happy/src/GetOpt.lhs

happy/src/Grammar.lhs

happy/src/Info.lhs

happy/src/IntSet.lhs

happy/src/LALR.lhs

happy/src/Lexer.lhs

happy/src/Main.lhs

happy/src/Makefile

happy/src/ParseMonad.lhs

happy/src/Parser.hs

happy/src/Parser.ly

happy/src/ProduceCode.lhs

happy/src/ProduceGLRCode.lhs

happy/src/Set.lhs

happy/src/Target.lhs

happy/src/TestLexer.lhs

happy/src/Version.hs

happy/src/happy.prj

happy/src/happy.sh

happy/templates

happy/templates/GLR_Base.lhs

happy/templates/GLR_Lib.lhs

happy/templates/GenericTemplate.hs

happy/templates/Makefile

happy/tests

happy/tests/Makefile

happy/tests/Partial.ly

happy/tests/Test.ly

happy/tests/TestMulti.ly

happy/tests/TestPrecedence.ly

happy/tests/bogus-token.y

happy/tests/bug001.ly

happy/tests/bug002.y

happy/tests/monad001.y

happy/tests/monad002.ly

happy/tests/precedence001.ly

happy/tests/precedence002.y

install-sh

mk/boilerplate.mk

mk/bootstrap.mk

mk/config.h.in

mk/config.mk.in

mk/fptools.css

mk/opts.mk

mk/package.mk

mk/paths.mk

mk/suffix.mk

mk/target.mk

files modified:
Makefile

README

debian/changelog

debian/control

debian/copyright

debian/doc-base

debian/docs

debian/rules

Show diffs side-by-side

added added

removed removed

src/LALR.lhs

-----------------------------------------------------------------------------

Generation of LALR parsing tables.

-----------------------------------------------------------------------------

> module LALR

> (genActionTable, genGotoTable, genLR0items, precalcClosure0,

> propLookaheads, calcLookaheads, mergeLookaheadInfo, countConflicts,

> Lr0Item, Lr1Item)

> where

> import GenUtils

> import Set ( Set )

> import qualified Set hiding ( Set )

> import Grammar

> import Control.Monad.ST

> import Data.Array.ST

> import Data.Array as Array

> import Data.List (nub)

> unionMap :: (Ord b) => (a -> Set b) -> Set a -> Set b

> unionMap f = Set.fold (Set.union . f) Set.empty

This means rule $a$, with dot at $b$ (all starting at 0)

> type Lr0Item = (Int,Int) -- (rule, dot)

> type Lr1Item = (Int,Int,Set Name) -- (rule, dot, lookahead)

> type RuleList = [Lr0Item]

-----------------------------------------------------------------------------

Generating the closure of a set of LR(0) items

Precalculate the rule closure for each non-terminal in the grammar,

using a memo table so that no work is repeated.

> precalcClosure0 :: Grammar -> Name -> RuleList

> precalcClosure0 g =

> \n -> case lookup n info' of

> Nothing -> []

> Just c -> c

> where

> info' :: [(Name, RuleList)]

> info' = map (\(n,rules) -> (n,map (\rule -> (rule,0)) (Set.toAscList rules))) info

> info :: [(Name, Set Int)]

> info = mkClosure (==) (\f -> map (follow f) f)

> (map (\nt -> (nt,Set.fromList (lookupProdsOfName g nt))) nts)

> follow :: [(Name, Set Int)] -> (Name, Set Int) -> (Name, Set Int)

> follow f (nt,rules) = (nt, unionMap (followNT f) rules `Set.union` rules)

> followNT :: [(Name, Set Int)] -> Int -> Set Int

> followNT f rule =

> case findRule g rule 0 of

> Just nt | nt >= firstStartTok && nt < fst_term ->

> case lookup nt f of

> Just rs -> rs

> Nothing -> error "followNT"

> _ -> Set.empty

> nts = non_terminals g

> fst_term = first_term g

> closure0 :: Grammar -> (Name -> RuleList) -> Set Lr0Item -> Set Lr0Item

> closure0 g closureOfNT set = Set.fold addRules Set.empty set

> where

> fst_term = first_term g

> addRules rule set = Set.union (Set.fromList (rule : closureOfRule rule)) set

> closureOfRule (rule,dot) =

> case findRule g rule dot of

> (Just nt) | nt >= firstStartTok && nt < fst_term

> -> closureOfNT nt

> _ -> []

-----------------------------------------------------------------------------

Generating the closure of a set of LR(1) items

> closure1 :: Grammar -> ([Name] -> Set Name) -> [Lr1Item] -> [Lr1Item]

> closure1 g first set

> = fst (mkClosure (\(_,new) _ -> null new) addItems ([],set))

> where

> fst_term = first_term g

> addItems :: ([Lr1Item],[Lr1Item]) -> ([Lr1Item],[Lr1Item])

> addItems (old_items, new_items) = (new_old_items, new_new_items)

> where

> new_old_items = new_items `union_items` old_items

> new_new_items = subtract_items

> (foldr union_items [] (map fn new_items))

> new_old_items

> fn :: Lr1Item -> [Lr1Item]

> fn (rule,dot,as) =

100

> case lookupProdNo g rule of { (name,lhs,_,_) ->

101

> case drop dot lhs of

102

> (b:beta) | b >= firstStartTok && b < fst_term ->

103

> let terms = unionMap

104

> (\a -> first (beta ++ [a])) as

105

> in

106

> [ (rule,0,terms) | rule <- lookupProdsOfName g b ]

107

> _ -> []

108

> }

109

110

Subtract the first set of items from the second.

111

112

> subtract_items :: [Lr1Item] -> [Lr1Item] -> [Lr1Item]

113

> subtract_items items1 items2 = foldr (subtract_item items2) [] items1

114

115

These utilities over item sets are crucial to performance.

116

117

Stamp on overloading with judicious use of type signatures...

118

119

> subtract_item :: [Lr1Item] -> Lr1Item -> [Lr1Item] -> [Lr1Item]

120

> subtract_item [] i result = i : result

121

> subtract_item ((rule,dot,as):items) i@(rule',dot',as') result =

122

> case compare rule' rule of

123

> LT -> i : result

124

> GT -> carry_on

125

> EQ -> case compare dot' dot of

126

> LT -> i : result

127

> GT -> carry_on

128

> EQ -> case Set.difference as' as of

129

> bs | Set.null bs -> result

130

> | otherwise -> (rule,dot,bs) : result

131

> where

132

> carry_on = subtract_item items i result

133

134

Union two sets of items.

135

136

> union_items :: [Lr1Item] -> [Lr1Item] -> [Lr1Item]

137

> union_items is [] = is

138

> union_items [] is = is

139

> union_items (i@(rule,dot,as):is) (i'@(rule',dot',as'):is') =

140

> case compare rule rule' of

141

> LT -> drop_i

142

> GT -> drop_i'

143

> EQ -> case compare dot dot' of

144

> LT -> drop_i

145

> GT -> drop_i'

146

> EQ -> (rule,dot,as `Set.union` as') : union_items is is'

147

> where

148

> drop_i = i : union_items is (i':is')

149

> drop_i' = i' : union_items (i:is) is'

150

151

-----------------------------------------------------------------------------

152

goto(I,X) function

153

154

The input should be the closure of a set of kernel items I together with

155

a token X (terminal or non-terminal. Output will be the set of kernel

156

items for the set of items goto(I,X)

157

158

> gotoClosure :: Grammar -> Set Lr0Item -> Name -> Set Lr0Item

159

> gotoClosure gram i x = unionMap fn i

160

> where

161

> fn (rule_no,dot) =

162

> case findRule gram rule_no dot of

163

> Just t | x == t -> Set.singleton (rule_no,dot+1)

164

> _ -> Set.empty

165

166

-----------------------------------------------------------------------------

167

Generating LR0 Item sets

168

169

The item sets are generated in much the same way as we find the

170

closure of a set of items: we use two sets, those which have already

171

generated more sets, and those which have just been generated. We

172

keep iterating until the second set is empty.

173

174

The addItems function is complicated by the fact that we need to keep

175

information about which sets were generated by which others.

176

177

> type ItemSetWithGotos = (Set Lr0Item, [(Name,Int)])

178

179

> genLR0items :: Grammar -> (Name -> RuleList) -> [ItemSetWithGotos]

180

> genLR0items g precalcClosures

181

> = fst (mkClosure (\(old,new) _ -> null new)

182

> addItems

183

> (([],startRules)))

184

> where

185

186

> n_starts = length (starts g)

187

> startRules :: [Set Lr0Item]

188

> startRules = [ Set.singleton (rule,0) | rule <- [0..n_starts] ]

189

190

> tokens = non_terminals g ++ terminals g

191

192

> addItems :: ([ItemSetWithGotos], [Set Lr0Item])

193

> -> ([ItemSetWithGotos], [Set Lr0Item])

194

195

> addItems (oldSets,newSets) = (newOldSets, reverse newNewSets)

196

> where

197

198

> newOldSets = oldSets ++ (zip newSets intgotos)

199

200

> itemSets = map fst oldSets ++ newSets

201

202

First thing to do is for each set in I in newSets, generate goto(I,X)

203

for each token (terminals and nonterminals) X.

204

205

> gotos :: [[(Name,Set Lr0Item)]]

206

> gotos = map (filter (not . Set.null . snd))

207

> (map (\i -> let i' = closure0 g precalcClosures i in

208

> [ (x,gotoClosure g i' x) | x <- tokens ]) newSets)

209

210

Next, we assign each new set a number, which is the index of this set

211

in the list of sets comprising all the sets generated so far plus

212

those generated in this iteration. We also filter out those sets that

213

are new, i.e. don't exist in the current list of sets, so that they

214

can be added.

215

216

We also have to make sure that there are no duplicate sets in the

217

*current* batch of goto(I,X) sets, as this could be disastrous. I

218

think I've squished this one with the '++ reverse newSets' in

219

numberSets.

220

221

numberSets is built this way so we can use it quite neatly with a foldr.

222

Unfortunately, the code's a little opaque.

223

224

> numberSets

225

> :: [(Name,Set Lr0Item)]

226

> -> (Int,

227

> [[(Name,Int)]],

228

> [Set Lr0Item])

229

> -> (Int, [[(Name,Int)]], [Set Lr0Item])

230

231

> numberSets [] (i,gotos,newSets) = (i,([]:gotos),newSets)

232

> numberSets ((x,gotoix):rest) (i,g:gotos,newSets)

233

> = numberSets rest

234

> (case indexInto 0 gotoix (itemSets ++ reverse newSets) of

235

> Just j -> (i, ((x,j):g):gotos, newSets)

236

> Nothing -> (i+1,((x,i):g):gotos, gotoix:newSets))

237

238

Finally, do some fiddling around to get this all in the form we want.

239

240

> intgotos :: [[(Name,Int)]]

241

> newNewSets :: [Set Lr0Item]

242

> (_, ([]:intgotos), newNewSets) =

243

> foldr numberSets (length newOldSets, [[]], []) gotos

244

245

> indexInto :: Eq a => Int -> a -> [a] -> Maybe Int

246

> indexInto _ _ [] = Nothing

247

> indexInto i x (y:ys) | x == y = Just i

248

> | otherwise = indexInto (i+1) x ys

249

250

-----------------------------------------------------------------------------

251

Computing propagation of lookaheads

252

253

ToDo: generate this info into an array to be used in the subsequent

254

calcLookaheads pass.

255

256

> propLookaheads

257

> :: Grammar

258

> -> [(Set Lr0Item,[(Name,Int)])] -- LR(0) kernel sets

259

> -> ([Name] -> Set Name) -- First function

260

> -> (

261

> [(Int, Lr0Item, Set Name)], -- spontaneous lookaheads

262

> Array Int [(Lr0Item, Int, Lr0Item)] -- propagated lookaheads

263

> )

264

265

> propLookaheads gram sets first = (concat s, array (0,length sets - 1)

266

> [ (a,b) | (a,b) <- p ])

267

> where

268

269

> (s,p) = unzip (zipWith propLASet sets [0..])

270

271

> propLASet :: (Set Lr0Item, [(Name, Int)]) -> Int -> ([(Int, Lr0Item, Set Name)],(Int,[(Lr0Item, Int, Lr0Item)]))

272

> propLASet (set,goto) i = (start_spont ++ concat s, (i, concat p))

273

> where

274

275

> (s,p) = unzip (map propLAItem (Set.toAscList set))

276

277

> -- spontaneous EOF lookaheads for each start state & rule...

278

> start_info :: [(String, Name, Name, Bool)]

279

> start_info = starts gram

280

281

> start_spont :: [(Int, Lr0Item ,Set Name)]

282

> start_spont = [ (start, (start,0),

283

> Set.singleton (startLookahead gram partial))

284

> | (start, (_,_,_,partial)) <-

285

> zip [ 0 .. length start_info - 1] start_info]

286

287

> propLAItem :: Lr0Item -> ([(Int, Lr0Item, Set Name)], [(Lr0Item, Int, Lr0Item)])

288

> propLAItem item@(rule,dot) = (spontaneous, propagated)

289

> where

290

291

> j = closure1 gram first [(rule,dot,Set.singleton dummyTok)]

292

293

> spontaneous :: [(Int, Lr0Item, Set Name)]

294

> spontaneous = concat [

295

> (case findRule gram rule dot of

296

> Nothing -> []

297

> Just x -> case lookup x goto of

298

> Nothing -> error "spontaneous"

299

> Just k ->

300

> case Set.filter (/= dummyTok) ts of

301

> ts' | Set.null ts' -> []

302

> | otherwise -> [(k, (rule, dot+1), ts')])

303

> | (rule,dot,ts) <- j ]

304

305

> propagated :: [(Lr0Item, Int, Lr0Item)]

306

> propagated = concat [

307

> (case findRule gram rule dot of

308

> Nothing -> []

309

> Just x -> case lookup x goto of

310

> Nothing -> error "propagated"

311

> Just k -> [(item, k, (rule, dot+1))])

312

> | (rule,dot,ts) <- j, dummyTok `elem` (Set.toAscList ts) ]

313

314

The lookahead for a start rule depends on whether it was declared

315

with %name or %partial: a %name parser is assumed to parse the whole

316

input, ending with EOF, whereas a %partial parser may parse only a

317

part of the input: it accepts when the error token is found.

318

319

> startLookahead :: Grammar -> Bool -> Name

320

> startLookahead gram partial = if partial then errorTok else eof_term gram

321

322

-----------------------------------------------------------------------------

323

Calculate lookaheads

324

325

Special version using a mutable array:

326

327

> calcLookaheads

328

> :: Int -- number of states

329

> -> [(Int, Lr0Item, Set Name)] -- spontaneous lookaheads

330

> -> Array Int [(Lr0Item, Int, Lr0Item)] -- propagated lookaheads

331

> -> Array Int [(Lr0Item, Set Name)]

332

333

> calcLookaheads n_states spont prop

334

> = runST (do

335

> array <- newArray (0,n_states) []

336

> propagate array (foldr fold_lookahead [] spont)

337

> freeze array

338

> )

339

340

> where

341

> propagate :: STArray s Int [(Lr0Item, Set Name)]

342

> -> [(Int, Lr0Item, Set Name)] -> ST s ()

343

> propagate array [] = return ()

344

> propagate array new = do

345

> let

346

> items = [ (i,item'',s) | (j,item,s) <- new,

347

> (item',i,item'') <- prop ! j,

348

> item == item' ]

349

> new_new <- get_new array items []

350

> add_lookaheads array new

351

> propagate array new_new

352

353

This function is needed to merge all the (set_no,item,name) triples

354

into (set_no, item, set name) triples. It can be removed when we get

355

the spontaneous lookaheads in the right form to begin with (ToDo).

356

357

> add_lookaheads array [] = return ()

358

> add_lookaheads array ((i,item,s) : lookaheads) = do

359

> las <- readArray array i

360

> writeArray array i (add_lookahead item s las)

361

> add_lookaheads array lookaheads

362

363

> get_new array [] new = return new

364

> get_new array (l@(i,item,s):las) new = do

365

> state_las <- readArray array i

366

> get_new array las (get_new' l state_las new)

367

368

> add_lookahead :: Lr0Item -> Set Name -> [(Lr0Item,Set Name)] ->

369

> [(Lr0Item,Set Name)]

370

> add_lookahead item s [] = [(item,s)]

371

> add_lookahead item s (m@(item',s') : las)

372

> | item == item' = (item, s `Set.union` s') : las

373

> | otherwise = m : add_lookahead item s las

374

375

> get_new' :: (Int,Lr0Item,Set Name) -> [(Lr0Item,Set Name)] ->

376

> [(Int,Lr0Item,Set Name)] -> [(Int,Lr0Item,Set Name)]

377

> get_new' l [] new = l : new

378

> get_new' l@(i,item,s) (m@(item',s') : las) new

379

> | item == item' =

380

> let s'' = Set.filter (\x -> not (Set.member x s')) s in

381

> if Set.null s'' then new else

382

> ((i,item,s''):new)

383

> | otherwise =

384

> get_new' l las new

385

386

> fold_lookahead :: (Int,Lr0Item,Set Name) -> [(Int,Lr0Item,Set Name)]

387

> -> [(Int,Lr0Item,Set Name)]

388

> fold_lookahead l [] = [l]

389

> fold_lookahead l@(i,item,s) (m@(i',item',s'):las)

390

> | i == i' && item == item' = (i,item, s `Set.union` s'):las

391

> | i < i' = (i,item,s):m:las

392

> | otherwise = m : fold_lookahead l las

393

394

Normal version:

395

396

calcLookaheads

397

:: Int -- number of states

398

-> [(Int, Lr0Item, Set Name)] -- spontaneous lookaheads

399

-> Array Int [(Lr0Item, Int, Lr0Item)] -- propagated lookaheads

400

-> Array Int [(Lr0Item, Set Name)]

401

402

calcLookaheads n_states spont prop

403

= rebuildArray $ fst (mkClosure (\(_,new) _ -> null new) propagate

404

([], foldr addLookahead [] spont))

405

where

406

407

rebuildArray :: [(Int, Lr0Item, Set Name)] -> Array Int [(Lr0Item, Set Name)]

408

rebuildArray xs = accumArray (++) [] (0,n_states-1)

409

[ (a, [(b,c)]) | (a,b,c) <- xs ]

410

411

propagate (las,new) =

412

let

413

items = [ (i,item'',s) | (j,item,s) <- new,

414

(item',i,item'') <- prop ! j,

415

item == item' ]

416

new_new = foldr (\i new -> getNew i las new) [] items

417

new_las = foldr addLookahead las new

418

419

(new_las, new_new)

420

421

addLookahead :: (Int,Lr0Item,Set Name) -> [(Int,Lr0Item,Set Name)]

422

-> [(Int,Lr0Item,Set Name)]

423

addLookahead l [] = [l]

424

addLookahead l@(i,item,s) (m@(i',item',s'):las)

425

| i == i' && item == item' = (i,item, s `Set.union` s'):las

426

| i < i' = (i,item,s):m:las

427

| otherwise = m : addLookahead l las

428

429

getNew :: (Int,Lr0Item,Set Name) -> [(Int,Lr0Item,Set Name)]

430

-> [(Int,Lr0Item,Set Name)] -> [(Int,Lr0Item,Set Name)]

431

getNew l [] new = l:new

432

getNew l@(i,item,s) (m@(i',item',s'):las) new

433

| i == i' && item == item' =

434

let s'' = filter (`notElem` s') s in

435

if null s'' then new else

436

((i,item,s''):new)

437

| i < i' = (i,item,s):new

438

| otherwise = getNew l las new

439

440

-----------------------------------------------------------------------------

441

Merge lookaheads

442

443

Stick the lookahead info back into the state table.

444

445

> mergeLookaheadInfo

446

> :: Array Int [(Lr0Item, Set Name)] -- lookahead info

447

> -> [(Set Lr0Item, [(Name,Int)])] -- state table

448

> -> [ ([Lr1Item], [(Name,Int)]) ]

449

450

> mergeLookaheadInfo lookaheads sets

451

> = zipWith mergeIntoSet sets [0..]

452

> where

453

454

> mergeIntoSet :: (Set Lr0Item, [(Name, Int)]) -> Int -> ([Lr1Item], [(Name, Int)])

455

> mergeIntoSet (items, goto) i

456

> = (concat (map mergeIntoItem (Set.toAscList items)), goto)

457

> where

458

459

> mergeIntoItem :: Lr0Item -> [Lr1Item]

460

> mergeIntoItem item@(rule,dot)

461

> = [(rule,dot,la)]

462

> where la = case [ s | (item',s) <- lookaheads ! i,

463

> item == item' ] of

464

> [] -> Set.empty

465

> [x] -> x

466

> _ -> error "mergIntoItem"

467

468

-----------------------------------------------------------------------------

469

Generate the goto table

470

471

This is pretty straightforward, given all the information we stored

472

while generating the LR0 sets of items.

473

474

Generating the goto table doesn't need lookahead info.

475

476

> genGotoTable :: Grammar -> [(Set Lr0Item,[(Name,Int)])] -> GotoTable

477

> genGotoTable g sets = gotoTable

478

> where

479

> Grammar{ first_nonterm = fst_nonterm,

480

> first_term = fst_term,

481

> non_terminals = non_terms } = g

482

483

> -- goto array doesn't include %start symbols

484

> gotoTable = listArray (0,length sets-1)

485

> [

486

> (array (fst_nonterm, fst_term-1) [

487

> (n, case lookup n goto of

488

> Nothing -> NoGoto

489

> Just s -> Goto s)

490

> | n <- non_terms,

491

> n >= fst_nonterm, n < fst_term ])

492

> | (set,goto) <- sets ]

493

494

-----------------------------------------------------------------------------

495

Generate the action table

496

497

> genActionTable :: Grammar -> ([Name] -> Set Name) ->

498

> [([Lr1Item],[(Name,Int)])] -> ActionTable

499

> genActionTable g first sets = actionTable

500

> where

501

> Grammar { first_term = fst_term,

502

> terminals = terms,

503

> starts = starts,

504

> priorities = prios } = g

505

506

> n_starts = length starts

507

> isStartRule rule = rule < n_starts -- a bit hacky, but it'll do for now

508

509

> term_lim = (head terms,last terms)

510

> actionTable = array (0,length sets-1)

511

> [ (set_no, accumArray res

512

> LR'Fail term_lim

513

> (possActions goto set))

514

> | ((set,goto),set_no) <- zip sets [0..] ]

515

516

> possAction goto set (rule,pos,la) =

517

> case findRule g rule pos of

518

> Just t | t >= fst_term || t == errorTok ->

519

> case lookup t goto of

520

> Nothing -> []

521

> Just j ->

522

> case lookup t prios of

523

> Nothing -> [ (t,LR'Shift j{-'-} No) ]

524

> Just p -> [ (t,LR'Shift j{-'-} p) ]

525

> Nothing

526

> | isStartRule rule

527

> -> let (_,_,_,partial) = starts !! rule in

528

> [ (startLookahead g partial, LR'Accept{-'-}) ]

529

> | otherwise

530

> -> case lookupProdNo g rule of

531

> (_,_,_,p) -> zip (Set.toAscList la) (repeat (LR'Reduce rule p))

532

> _ -> []

533

534

> possActions goto coll =

535

> (concat [ possAction goto coll item |

536

> item <- closure1 g first coll ])

537

538

These comments are now out of date! /JS

539

540

Here's how we resolve conflicts, leaving a complete record of the

541

conflicting actions in an LR'Multiple structure for later output in

542

the info file.

543

544

Shift/reduce conflicts are always resolved as shift actions, and

545

reduce/reduce conflicts are resolved as a reduce action using the rule

546

with the lowest number (i.e. the rule that comes first in the grammar

547

file.)

548

549

NOTES on LR'MustFail: this was introduced as part of the precedence

550

parsing changes. The problem with LR'Fail is that it is a soft

551

failure: we sometimes substitute an LR'Fail for an LR'Reduce (eg. when

552

computing default actions), on the grounds that an LR'Fail in this

553

state will also be an LR'Fail in the goto state, so we'll fail

554

eventually. This may not be true with precedence parsing, though. If

555

there are two non-associative operators together, we must fail at this

556

point rather than reducing. Hence the use of LR'MustFail.

557

558

559

NOTE: on (LR'Multiple as a) handling

560

PCC [sep04] has changed this to have the following invariants:

561

* the winning action appears only once, in the "a" slot

562

* only reductions appear in the "as" list

563

* there are no duplications

564

This removes complications elsewhere, where LR'Multiples were

565

building up tree structures...

566

567

> res LR'Fail x = x

568

> res x LR'Fail = x

569

> res LR'MustFail x = LR'MustFail

570

> res x LR'MustFail = LR'MustFail

571

> res x x' | x == x' = x

572

> res (LR'Accept) _ = LR'Accept

573

> res _ (LR'Accept) = LR'Accept

574

575

> res a@(LR'Multiple as x) b@(LR'Multiple bs x')

576

> | x == x' = LR'Multiple (nub $ as ++ bs) x

577

> -- merge dropped reductions for identical action

578

579

> res a@(LR'Multiple as x) b@(LR'Multiple bs x')

580

> = case res x x' of

581

> LR'Multiple cs a

582

> | a == x -> LR'Multiple (nub $ x' : as ++ bs ++ cs) x

583

> | a == x' -> LR'Multiple (nub $ x : as ++ bs ++ cs) x'

584

> | otherwise -> error "failed invariant in resolve"

585

> -- last means an unexpected change

586

> other -> other

587

> -- merge dropped reductions for clashing actions, but only

588

> -- if they were S/R or R/R

589

590

> res a@(LR'Multiple _ _) b = res a (LR'Multiple [] b)

591

> res a b@(LR'Multiple _ _) = res (LR'Multiple [] a) b

592

> -- leave cases above to do the appropriate merging

593

594

> res a@(LR'Shift s p) b@(LR'Reduce s' p') = res b a

595

> res a@(LR'Reduce s p) b@(LR'Shift s' p')

596

> = case (p,p') of

597

> (No,_) -> LR'Multiple [a] b -- shift wins

598

> (_,No) -> LR'Multiple [a] b -- shift wins

599

> (Prio c i, Prio _ j)

600

> | i < j -> b

601

> | i > j -> a

602

> | otherwise ->

603

> case c of

604

> LeftAssoc -> a

605

> RightAssoc -> b

606

> None -> LR'MustFail

607

> res a@(LR'Reduce r p) b@(LR'Reduce r' p')

608

> = case (p,p') of

609

> (No,_) -> LR'Multiple [a] b -- give to earlier rule?

610

> (_,No) -> LR'Multiple [a] b

611

> (Prio c i, Prio _ j)

612

> | i < j -> b

613

> | j > i -> a

614

> | r < r' -> LR'Multiple [b] a

615

> | otherwise -> LR'Multiple [a] b

616

> res _ _ = error "confict in resolve"

617

618

-----------------------------------------------------------------------------

619

Count the conflicts

620

621

> countConflicts :: ActionTable -> (Array Int (Int,Int), (Int,Int))

622

> countConflicts action

623

> = (conflictArray, foldr (\(a,b) (c,d) -> (a+c, b+d)) (0,0) conflictList)

624

625

> where

626

627

> conflictArray = listArray (Array.bounds action) conflictList

628

> conflictList = map countConflictsState (assocs action)

629

630

> countConflictsState (state, actions)

631

> = foldr countMultiples (0,0) (elems actions)

632

> where

633

> countMultiples (LR'Multiple (_:_) (LR'Shift{})) (sr,rr)

634

> = (sr + 1, rr)

635

> countMultiples (LR'Multiple (_:_) (LR'Reduce{})) (sr,rr)

636

> = (sr, rr + 1)

637

> countMultiples (LR'Multiple as a) (sr,rr)

638

> = error "bad conflict representation"

639

> countMultiples _ c = c

640

641

-----------------------------------------------------------------------------

642

643

> findRule :: Grammar -> Int -> Int -> Maybe Name

644

> findRule g rule dot =

645

> case lookupProdNo g rule of

646

> (_,lhs,_,_) -> case drop dot lhs of

647

> (a:_) -> Just a

648

> _ -> Nothing

Older »