diff options
| author | kr.angelov <kr.angelov@gmail.com> | 2007-09-24 14:36:19 +0000 |
|---|---|---|
| committer | kr.angelov <kr.angelov@gmail.com> | 2007-09-24 14:36:19 +0000 |
| commit | c6c7557b13091116f66884c0d6105dca0fd33df3 (patch) | |
| tree | 03b141c295280c703cf39f82df099d5168b1842a /src/GF/Parsing | |
| parent | 9222e4d34c00cffb47a581693a17403e1e4cc3d2 (diff) | |
merge FCFGParsing with GF.Parsing.FCFG
Diffstat (limited to 'src/GF/Parsing')
| -rw-r--r-- | src/GF/Parsing/FCFG.hs | 88 | ||||
| -rw-r--r-- | src/GF/Parsing/GFC.hs | 86 |
2 files changed, 129 insertions, 45 deletions
diff --git a/src/GF/Parsing/FCFG.hs b/src/GF/Parsing/FCFG.hs index 91b4201b7..7784285e1 100644 --- a/src/GF/Parsing/FCFG.hs +++ b/src/GF/Parsing/FCFG.hs @@ -8,25 +8,91 @@ ----------------------------------------------------------------------------- module GF.Parsing.FCFG - (parseFCF, module GF.Parsing.FCFG.PInfo) where + (parseFCF,buildFCFPInfo,FCFPInfo(..),makeFinalEdge) where -import GF.Data.Operations (Err(..)) +import GF.Data.SortedList +import GF.Data.Assoc +import GF.Infra.PrintClass + +import GF.Formalism.FCFG import GF.Formalism.Utilities -import GF.Parsing.FCFG.PInfo import qualified GF.Parsing.FCFG.Active as Active -import GF.Infra.PrintClass +import GF.Parsing.FCFG.PInfo + +import GF.Canon.GFCC.AbsGFCC +import GF.Canon.GFCC.ErrM + ---------------------------------------------------------------------- -- parsing -parseFCF :: String -> Err (FCFParser) -parseFCF prs | prs `elem` strategies = Ok $ parseFCF' prs - | otherwise = Bad $ "FCFG parsing strategy not defined: " ++ prs +-- main parsing function + +parseFCF :: + String -> -- ^ parsing strategy + FCFPInfo -> -- ^ compiled grammar (fcfg) + CId -> -- ^ starting category + [String] -> -- ^ input tokens + Err [Exp] -- ^ resulting GF terms +parseFCF strategy pinfo startCat inString = + do let inTokens = input inString + startCats = filter isStart $ grammarCats pinfo + isStart cat = fcat2cid cat == startCat + fcfParser <- parseFCF strategy + let chart = fcfParser pinfo startCats inTokens + (i,j) = inputBounds inTokens + finalEdges = [makeFinalEdge cat i j | cat <- startCats] + forests = map cnv_forests $ chart2forests chart (const False) finalEdges + filteredForests = forests >>= applyProfileToForest + trees = nubsort $ filteredForests >>= forest2trees + return $ map tree2term trees + where + parseFCF :: String -> Err (FCFParser) + parseFCF "bottomup" = Ok $ Active.parse "b" + parseFCF "topdown" = Ok $ Active.parse "t" + parseFCF strat = Bad $ "FCFG parsing strategy not defined: " ++ strat + -strategies = words "bottomup topdown" +cnv_forests FMeta = FMeta +cnv_forests (FNode (Name (CId n) p) fss) = FNode (Name (CId n) (map cnv_profile p)) (map (map cnv_forests) fss) +cnv_forests (FString x) = FString x +cnv_forests (FInt x) = FInt x +cnv_forests (FFloat x) = FFloat x + +cnv_profile (Unify x) = Unify x +cnv_profile (Constant x) = Constant (cnv_forests2 x) + +cnv_forests2 FMeta = FMeta +cnv_forests2 (FNode (CId n) fss) = FNode (CId n) (map (map cnv_forests2) fss) +cnv_forests2 (FString x) = FString x +cnv_forests2 (FInt x) = FInt x +cnv_forests2 (FFloat x) = FFloat x + +---------------------------------------------------------------------- +-- parse trees to GFCC terms + +tree2term :: SyntaxTree CId -> Exp +tree2term (TNode f ts) = Tr (AC f) (map tree2term ts) + +tree2term (TString s) = Tr (AS s) [] +tree2term (TInt n) = Tr (AI n) [] +tree2term (TFloat f) = Tr (AF f) [] +tree2term (TMeta) = Tr AM [] + +---------------------------------------------------------------------- +-- conversion and unification of forests -parseFCF' :: String -> FCFParser -parseFCF' "bottomup" pinfo starts toks = Active.parse "b" pinfo starts toks -parseFCF' "topdown" pinfo starts toks = Active.parse "t" pinfo starts toks +-- simplest implementation +applyProfileToForest :: SyntaxForest FName -> [SyntaxForest CId] +applyProfileToForest (FNode name@(Name fun profile) children) + | isCoercionF name = concat chForests + | otherwise = [ FNode fun chForests | not (null chForests) ] + where chForests = concat [ applyProfileM unifyManyForests profile forests | + forests0 <- children, + forests <- mapM applyProfileToForest forests0 ] +applyProfileToForest (FString s) = [FString s] +applyProfileToForest (FInt n) = [FInt n] +applyProfileToForest (FFloat f) = [FFloat f] +applyProfileToForest (FMeta) = [FMeta] diff --git a/src/GF/Parsing/GFC.hs b/src/GF/Parsing/GFC.hs index 948d3577b..2486efd81 100644 --- a/src/GF/Parsing/GFC.hs +++ b/src/GF/Parsing/GFC.hs @@ -25,8 +25,9 @@ import qualified GF.Grammar.Grammar as Grammar import qualified GF.Grammar.Macros as Macros import qualified GF.Canon.AbsGFC as AbsGFC import qualified GF.Canon.GFCC.AbsGFCC as AbsGFCC +import qualified GF.Canon.GFCC.ErrM as ErrM import qualified GF.Infra.Ident as Ident -import GF.CF.CFIdent (CFCat, cfCat2Ident, CFTok, wordsCFTok) +import GF.CF.CFIdent (CFCat, cfCat2Ident, CFTok, wordsCFTok, prCFTok) import GF.Data.SortedList import GF.Data.Assoc @@ -73,26 +74,12 @@ parse :: String -- ^ parsing algorithm (mcfg or cfg) -> [CFTok] -- ^ input tokens -> Err [Grammar.Term] -- ^ resulting GF terms -parse prs strategy pinfo abs startCat inString = - do let inTokens = tracePrt "Parsing.GFC - input tokens" prt $ - inputMany (map wordsCFTok inString) - forests <- selectParser prs strategy pinfo startCat inTokens - traceM "Parsing.GFC - nr. unfiltered forests" (prt (length forests)) - traceM "Parsing.GFC - nr. unfiltered trees" (prt (length (forests >>= forest2trees))) - let filteredForests = tracePrt "Parsing.GFC - nr. forests" (prt . length) $ - forests >>= applyProfileToForest - -- compactFs = tracePrt "#compactForests" (prt . length) $ - -- tracePrt "compactForests" (prtBefore "\n") $ - -- compactForests forests - trees = tracePrt "Parsing.GFC - nr. trees" (prt . length) $ - nubsort $ filteredForests >>= forest2trees - -- compactFs >>= forest2trees - return $ map (tree2term abs) trees - -- parsing via CFG -selectParser "c" strategy pinfo startCat inTokens - = do let startCats = tracePrt "Parsing.GFC - starting CF categories" prt $ +parse "c" strategy pinfo abs startCat inString + = do let inTokens = tracePrt "Parsing.GFC - input tokens" prt $ + inputMany (map wordsCFTok inString) + let startCats = tracePrt "Parsing.GFC - starting CF categories" prt $ filter isStart $ map fst $ aAssocs $ PC.topdownRules cfpi isStart cat = ccat2scat cat == cfCat2Ident startCat cfpi = cfPInfo pinfo @@ -103,11 +90,25 @@ selectParser "c" strategy pinfo startCat inTokens C.grammar2chart cfChart finalEdges = tracePrt "Parsing.GFC - final chart edges" prt $ map (uncurry Edge (inputBounds inTokens)) startCats - return $ chart2forests chart (const False) finalEdges + forests = chart2forests chart (const False) finalEdges + traceM "Parsing.GFC - nr. unfiltered forests" (prt (length forests)) + traceM "Parsing.GFC - nr. unfiltered trees" (prt (length (forests >>= forest2trees))) + let filteredForests = tracePrt "Parsing.GFC - nr. forests" (prt . length) $ + forests >>= applyProfileToForest + -- compactFs = tracePrt "#compactForests" (prt . length) $ + -- tracePrt "compactForests" (prtBefore "\n") $ + -- compactForests forests + trees = tracePrt "Parsing.GFC - nr. trees" (prt . length) $ + nubsort $ filteredForests >>= forest2trees + -- compactFs >>= forest2trees + return $ map (tree2term abs) trees + -- parsing via MCFG -selectParser "m" strategy pinfo startCat inTokens - = do let startCats = tracePrt "Parsing.GFC - starting MCF categories" prt $ +parse "m" strategy pinfo abs startCat inString + = do let inTokens = tracePrt "Parsing.GFC - input tokens" prt $ + inputMany (map wordsCFTok inString) + let startCats = tracePrt "Parsing.GFC - starting MCF categories" prt $ filter isStart $ PM.grammarCats mcfpi isStart cat = mcat2scat cat == cfCat2Ident startCat mcfpi = mcfPInfo pinfo @@ -116,20 +117,28 @@ selectParser "m" strategy pinfo startCat inTokens finalEdges = tracePrt "Parsing.GFC - final chart edges" prt $ [ PM.makeFinalEdge cat lbl (inputBounds inTokens) | cat@(MCat _ [lbl]) <- startCats ] - return $ chart2forests chart (const False) finalEdges + forests = chart2forests chart (const False) finalEdges + traceM "Parsing.GFC - nr. unfiltered forests" (prt (length forests)) + traceM "Parsing.GFC - nr. unfiltered trees" (prt (length (forests >>= forest2trees))) + let filteredForests = tracePrt "Parsing.GFC - nr. forests" (prt . length) $ + forests >>= applyProfileToForest + -- compactFs = tracePrt "#compactForests" (prt . length) $ + -- tracePrt "compactForests" (prtBefore "\n") $ + -- compactForests forests + trees = tracePrt "Parsing.GFC - nr. trees" (prt . length) $ + nubsort $ filteredForests >>= forest2trees + -- compactFs >>= forest2trees + return $ map (tree2term abs) trees + -- parsing via FCFG -selectParser "f" strategy pinfo startCat inTokens - = do let startCats = filter isStart $ PF.grammarCats fcfpi - isStart cat = cat' == cfCat2Ident startCat - where AbsGFCC.CId x = fcat2cid cat - cat' = Ident.IC x - fcfpi = fcfPInfo pinfo - fcfParser <- PF.parseFCF strategy - let chart = fcfParser fcfpi startCats inTokens - (i,j) = inputBounds inTokens - finalEdges = [PF.makeFinalEdge cat i j | cat <- startCats] - return $ map cnv_forests $ chart2forests chart (const False) finalEdges +parse "f" strategy pinfo abs startCat inString = + let Ident.IC x = cfCat2Ident startCat + cat' = AbsGFCC.CId x + in case PF.parseFCF strategy (fcfPInfo pinfo) cat' (map prCFTok inString) of + ErrM.Ok es -> Ok (map (exp2term abs) es) + ErrM.Bad msg -> Bad msg + -- error parser: selectParser prs strategy _ _ _ = Bad $ "Parser '" ++ prs ++ "' not defined with strategy: " ++ strategy @@ -159,6 +168,15 @@ tree2term abs (TInt n) = Macros.int2term n tree2term abs (TFloat f) = Macros.float2term f tree2term abs (TMeta) = Macros.mkMeta 0 +exp2term :: Ident.Ident -> AbsGFCC.Exp -> Grammar.Term +exp2term abs (AbsGFCC.Tr a es) = Macros.mkApp (atom2term abs a) (map (exp2term abs) es) + +atom2term :: Ident.Ident -> AbsGFCC.Atom -> Grammar.Term +atom2term abs (AbsGFCC.AC (AbsGFCC.CId f)) = Macros.qq (abs,Ident.IC f) +atom2term abs (AbsGFCC.AS s) = Macros.string2term s +atom2term abs (AbsGFCC.AI n) = Macros.int2term n +atom2term abs (AbsGFCC.AF f) = Macros.float2term f +atom2term abs AbsGFCC.AM = Macros.mkMeta 0 ---------------------------------------------------------------------- -- conversion and unification of forests |
