summaryrefslogtreecommitdiff
path: root/src/GF
diff options
context:
space:
mode:
Diffstat (limited to 'src/GF')
-rw-r--r--src/GF/Speech/TransformCFG.hs21
1 files changed, 18 insertions, 3 deletions
diff --git a/src/GF/Speech/TransformCFG.hs b/src/GF/Speech/TransformCFG.hs
index c640caa0f..049aa8fc4 100644
--- a/src/GF/Speech/TransformCFG.hs
+++ b/src/GF/Speech/TransformCFG.hs
@@ -41,7 +41,6 @@ import Data.Monoid (mconcat)
import Data.Set (Set)
import qualified Data.Set as Set
-
-- not very nice to replace the structured CFCat type with a simple string
type CFRule_ = CFRule Cat_ CFTerm Token
@@ -104,14 +103,21 @@ removeCycles = groupProds . f . ungroupProds
-- | Removes productions which use categories which have no productions.
-- Only does one pass through the grammar.
-bottomUpFilter :: CFRules -> CFRules
-bottomUpFilter rs = k'
+bottomUpFilter_old :: CFRules -> CFRules
+bottomUpFilter_old rs = k'
where
keep = filter (not . null . snd) rs
allCats = nub [c | (_,r) <- rs, CFRule _ rhs _ <- r, Cat c <- rhs]
emptyCats = filter (nothingOrNull . flip lookup rs) allCats
k' = map (\ (c,xs) -> (c, filter (not . anyUsedBy emptyCats) xs)) keep
+-- | Better bottom-up filter that also removes categories which contain no finite
+-- strings.
+bottomUpFilter :: CFRules -> CFRules
+bottomUpFilter gr = fix grow []
+ where grow g = g `unionCFRules` filterCFRules (all (okSym g) . ruleRhs) gr
+ okSym g = symbol (`elem` allCats g) (const True)
+
-- | Removes categories which are not reachable from the start category.
-- Only does one pass through the grammar.
topDownFilter :: Cat_ -> CFRules -> CFRules
@@ -305,6 +311,15 @@ catRules rs c = fromMaybe [] (lookup c rs)
catSetRules :: CFRules -> Set Cat_ -> [CFRule_]
catSetRules g cs = concat [rs | (c,rs) <- g, c `Set.member` cs]
+unionCFRules :: CFRules -> CFRules -> CFRules
+unionCFRules x y = Map.toList $ Map.map Set.toList $ Map.unionWith Set.union (fromCFRules x) (fromCFRules y)
+ where
+ fromCFRules :: CFRules -> Map Cat_ (Set CFRule_)
+ fromCFRules g = Map.fromListWith Set.union [(c, Set.fromList rs) | (c,rs) <- g]
+
+filterCFRules :: (CFRule_ -> Bool) -> CFRules -> CFRules
+filterCFRules p gr = [(c,rs') | (c,rs) <- gr, let rs' = filter p rs, not (null rs')]
+
lhsCat :: CFRule c n t -> c
lhsCat (CFRule c _ _) = c