diff options
| author | krasimir <krasimir@chalmers.se> | 2010-04-30 14:36:06 +0000 |
|---|---|---|
| committer | krasimir <krasimir@chalmers.se> | 2010-04-30 14:36:06 +0000 |
| commit | 8460598801b644f323db0b7d7ca879e3acb9215b (patch) | |
| tree | 02aaf44ec76bf9738f996bfc1688a94f308cde27 /src/runtime/haskell/PGF/Linearize.hs | |
| parent | 7a4cb3c2715c5dd61309b9bc0309142a44393c29 (diff) | |
first incarnation of the bracketed string API
Diffstat (limited to 'src/runtime/haskell/PGF/Linearize.hs')
| -rw-r--r-- | src/runtime/haskell/PGF/Linearize.hs | 174 |
1 files changed, 97 insertions, 77 deletions
diff --git a/src/runtime/haskell/PGF/Linearize.hs b/src/runtime/haskell/PGF/Linearize.hs index 058d8281f..4a399f5e9 100644 --- a/src/runtime/haskell/PGF/Linearize.hs +++ b/src/runtime/haskell/PGF/Linearize.hs @@ -1,8 +1,15 @@ -module PGF.Linearize(linearizes,markLinearizes,tabularLinearizes) where +module PGF.Linearize + ( linearize + , linearizeAll + , linearizeAllLang + , bracketedLinearize + , tabularLinearizes + ) where import PGF.CId import PGF.Data import PGF.Macros +import PGF.Expr import Data.Array.IArray import Data.List import Control.Monad @@ -10,99 +17,112 @@ import qualified Data.Map as Map import qualified Data.IntMap as IntMap import qualified Data.Set as Set --- linearization and computation of concrete PGF Terms +-------------------------------------------------------------------- +-- The API +-------------------------------------------------------------------- -type LinTable = Array LIndex [Tokn] +-- | Linearizes given expression as string in the language +linearize :: PGF -> Language -> Tree -> String +linearize pgf lang = concat . take 1 . map (unwords . concatMap flattenBracketedString . snd . untokn "" . (!0)) . linTree pgf lang -linearizes :: PGF -> CId -> Expr -> [String] -linearizes pgf lang = map (unwords . untokn . (! 0)) . linTree pgf lang (\_ _ lint -> lint) +-- | The same as 'linearizeAllLang' but does not return +-- the language. +linearizeAll :: PGF -> Tree -> [String] +linearizeAll pgf = map snd . linearizeAllLang pgf -linTree :: PGF -> Language -> (Maybe CId -> [Int] -> LinTable -> LinTable) -> Expr -> [LinTable] -linTree pgf lang mark e = lin0 [] [] [] Nothing e +-- | Linearizes given expression as string in all languages +-- available in the grammar. +linearizeAllLang :: PGF -> Tree -> [(Language,String)] +linearizeAllLang pgf t = [(lang,linearize pgf lang t) | lang <- Map.keys (concretes pgf)] + +-- | Linearizes given expression as a bracketed string in the language +bracketedLinearize :: PGF -> Language -> Tree -> BracketedString +bracketedLinearize pgf lang = head . concat . map (snd . untokn "" . (!0)) . linTree pgf lang + +-- | Creates a table from feature name to linearization. +-- The outher list encodes the variations +tabularLinearizes :: PGF -> CId -> Expr -> [[(String,String)]] +tabularLinearizes pgf lang e = map (zip lbls . map (unwords . concatMap flattenBracketedString . snd . untokn "") . elems) + (linTree pgf lang e) + where + lbls = case unApp e of + Just (f,_) -> let cat = valCat (lookType pgf f) + in case Map.lookup cat (cnccats (lookConcr pgf lang)) of + Just (CncCat _ _ lbls) -> elems lbls + Nothing -> error "No labels" + Nothing -> error "Not function application" + +-------------------------------------------------------------------- +-- Implementation +-------------------------------------------------------------------- + +linTree :: PGF -> Language -> Expr -> [Array LIndex BracketedTokn] +linTree pgf lang e = + [amapWithIndex (\label -> Bracket_ fid label cat) lin | (_,(fid,cat,lin)) <- lin0 [] [] Nothing 0 e] where cnc = lookMap (error "no lang") lang (concretes pgf) lp = lproductions cnc - - lin0 path xs ys mb_fid (EAbs _ x e) = lin0 path (showCId x:xs) ys mb_fid e - lin0 path xs ys mb_fid (ETyped e _) = lin0 path xs ys mb_fid e - lin0 path xs ys mb_fid e | null xs = lin path ys mb_fid e [] - | otherwise = apply path (xs ++ ys) mb_fid _B (e:[ELit (LStr x) | x <- xs]) - - lin path xs mb_fid (EApp e1 e2) es = lin path xs mb_fid e1 (e2:es) - lin path xs mb_fid (ELit l) [] = case l of - LStr s -> return (mark Nothing path (ss s)) - LInt n -> return (mark Nothing path (ss (show n))) - LFlt f -> return (mark Nothing path (ss (show f))) - lin path xs mb_fid (EMeta i) es = apply path xs mb_fid _V (ELit (LStr ('?':show i)):es) - lin path xs mb_fid (EFun f) es = map (mark (Just f) path) (apply path xs mb_fid f es) - lin path xs mb_fid (EVar i) es = apply path xs mb_fid _V (ELit (LStr (xs !! i)) :es) - lin path xs mb_fid (ETyped e _) es = lin path xs mb_fid e es - lin path xs mb_fid (EImplArg e) es = lin path xs mb_fid e es - - ss s = listArray (0,0) [[KS s]] - - apply path xs mb_fid f es = + + lin0 xs ys mb_fid n_fid (EAbs _ x e) = lin0 (showCId x:xs) ys mb_fid n_fid e + lin0 xs ys mb_fid n_fid (ETyped e _) = lin0 xs ys mb_fid n_fid e + lin0 xs ys mb_fid n_fid e | null xs = lin ys mb_fid n_fid e [] + | otherwise = apply (xs ++ ys) mb_fid n_fid _B (e:[ELit (LStr x) | x <- xs]) + + lin xs mb_fid n_fid (EApp e1 e2) es = lin xs mb_fid n_fid e1 (e2:es) + lin xs mb_fid n_fid (ELit l) [] = case l of + LStr s -> return (n_fid+1,(n_fid,cidString,ss s)) + LInt n -> return (n_fid+1,(n_fid,cidInt ,ss (show n))) + LFlt f -> return (n_fid+1,(n_fid,cidFloat ,ss (show f))) + lin xs mb_fid n_fid (EMeta i) es = apply xs mb_fid n_fid _V (ELit (LStr ('?':show i)):es) + lin xs mb_fid n_fid (EFun f) es = apply xs mb_fid n_fid f es + lin xs mb_fid n_fid (EVar i) es = apply xs mb_fid n_fid _V (ELit (LStr (xs !! i)) :es) + lin xs mb_fid n_fid (ETyped e _) es = lin xs mb_fid n_fid e es + lin xs mb_fid n_fid (EImplArg e) es = lin xs mb_fid n_fid e es + + ss s = listArray (0,0) [[LeafKS [s]]] + + apply :: [String] -> Maybe FId -> FId -> CId -> [Expr] -> [(FId,(FId, CId, LinTable))] + apply xs mb_fid n_fid f es = case Map.lookup f lp of - Just prods -> case lookupProds mb_fid prods of - Just set -> do prod <- Set.toList set - case prod of - PApply funid fids -> do guard (length fids == length es) - args <- sequence (zipWith3 (\i fid e -> lin0 (sub i path) [] xs (Just fid) e) [0..] fids es) - let (CncFun _ lins) = cncfuns cnc ! funid - return (listArray (bounds lins) [computeSeq seqid args | seqid <- elems lins]) - PCoerce fid -> apply path xs (Just fid) f es - Nothing -> mzero - Nothing -> apply path xs mb_fid _V [ELit (LStr ("[" ++ showCId f ++ "]"))] -- fun without lin + Just prods -> do prod <- lookupProds mb_fid prods + case prod of + PApply funid fids -> do guard (length fids == length es) + (n_fid,args) <- descend n_fid (zip fids es) + let (CncFun fun lins) = cncfuns cnc ! funid + Just (DTyp _ cat _,_,_) = Map.lookup fun (funs (abstract pgf)) + return (n_fid+1,(n_fid,cat,listArray (bounds lins) [computeSeq seqid args | seqid <- elems lins])) + PCoerce fid -> apply xs (Just fid) n_fid f es + Nothing -> apply xs mb_fid n_fid _V [ELit (LStr ("[" ++ showCId f ++ "]"))] -- fun without lin where - lookupProds (Just fid) prods = IntMap.lookup fid prods + lookupProds (Just fid) prods = maybe [] Set.toList (IntMap.lookup fid prods) lookupProds Nothing prods - | f == _B || f == _V = Nothing - | otherwise = Just (Set.filter isApp (Set.unions (IntMap.elems prods))) + | f == _B || f == _V = [] + | otherwise = [prod | (fid,set) <- IntMap.toList prods, prod <- Set.toList set] - sub i path - | f == _B || f == _V = path - | otherwise = i:path + descend n_fid [] = return (n_fid,[]) + descend n_fid ((fid,e):fes) = do (n_fid,xx) <- lin0 [] xs (Just fid) n_fid e + (n_fid,xxs) <- descend n_fid fes + return (n_fid,xx:xxs) isApp (PApply _ _) = True isApp _ = False + computeSeq :: SeqId -> [(FId,CId,LinTable)] -> [BracketedTokn] computeSeq seqid args = concatMap compute (elems seq) where seq = sequences cnc ! seqid - compute (SymCat d r) = (args !! d) ! r - compute (SymLit d r) = (args !! d) ! r - compute (SymKS ts) = map KS ts - compute (SymKP ts alts) = [KP ts alts] - -untokn :: [Tokn] -> [String] -untokn ts = case ts of - KP d _ : [] -> d - KP d vs : ws -> let ss@(s:_) = untokn ws in sel d vs s ++ ss - KS s : ws -> s : untokn ws - [] -> [] - where - sel d vs w = case [v | Alt v cs <- vs, any (\c -> isPrefixOf c w) cs] of - v:_ -> v - _ -> d - --- create a table from labels+params to variants -tabularLinearizes :: PGF -> CId -> Expr -> [[(String,String)]] -tabularLinearizes pgf lang e = map (zip lbls . map (unwords . untokn) . elems) (linTree pgf lang (\_ _ lint -> lint) e) - where - lbls = case unApp e of - Just (f,_) -> let cat = valCat (lookType pgf f) - in case Map.lookup cat (cnccats (lookConcr pgf lang)) of - Just (CncCat _ _ lbls) -> elems lbls - Nothing -> error "No labels" - Nothing -> error "Not function application" + compute (SymCat d r) = getArg d r + compute (SymLit d r) = getArg d r + compute (SymKS ts) = [LeafKS ts] + compute (SymKP ts alts) = [LeafKP ts alts] + getArg d r + | not (null arg_lin) = [Bracket_ fid r cat arg_lin] + | otherwise = arg_lin + where + arg_lin = lin ! r + (fid,cat,lin) = args !! d --- show bracketed markup with references to tree structure -markLinearizes :: PGF -> CId -> Expr -> [String] -markLinearizes pgf lang = map (unwords . untokn . (! 0)) . linTree pgf lang mark - where - mark mb_f path lint = amap (bracket mb_f path) lint - - bracket Nothing path ts = [KS ("("++show (reverse path))] ++ ts ++ [KS ")"] - bracket (Just f) path ts = [KS ("(("++showCId f++","++show (reverse path)++")")] ++ ts ++ [KS ")"] +amapWithIndex :: (IArray a e1, IArray a e2, Ix i) => (i -> e1 -> e2) -> a i e1 -> a i e2 +amapWithIndex f arr = listArray (bounds arr) (map (uncurry f) (assocs arr)) |
