summary refs log tree commit diff
path: root/src/GF/GFCC/Generate.hs
diff options
context:
space:
mode:
author aarne <aarne@cs.chalmers.se> 2007-10-04 21:38:59 +0000
committer aarne <aarne@cs.chalmers.se> 2007-10-04 21:38:59 +0000
commit 48ebf562b9bfcacff7c0fabeaa5892f31ddd3e1c (patch)
tree 7c39399a32dd7b66e9921118de61e9246468944d /src/GF/GFCC/Generate.hs
parent acc32ec199694c0e57df9f4a1f2273d166b88be4 (diff)
new GFCC format in GF/GFCC
Diffstat (limited to 'src/GF/GFCC/Generate.hs')
-rw-r--r-- src/GF/GFCC/Generate.hs 79
1 files changed, 79 insertions, 0 deletions
diff --git a/src/GF/GFCC/Generate.hs b/src/GF/GFCC/Generate.hs
new file mode 100644
index 000000000..758e96d8c
--- /dev/null
+++ b/src/GF/GFCC/Generate.hs
@@ -0,0 +1,79 @@
+module GF.GFCC.Generate where
+
+import GF.GFCC.DataGFCC
+import GF.GFCC.AbsGFCC
+
+import qualified Data.Map as M
+import System.Random
+
+-- | Enumerate the trees of category @cat@ in order of increasing depth,
+-- each tree exactly once. A function applied to no arguments has depth 1.
+--
+-- The result is conceptually infinite: when the grammar admits only finitely
+-- many trees, demanding elements past the last one does not terminate.
+--
+-- Earlier revisions filtered with @depth tr >= i@ while drawing children only
+-- from the previous level; that emitted nullary trees twice and never
+-- produced trees whose sibling subtrees differ in depth by two or more.
+generate :: GFCC -> CId -> [Exp]
+generate gfcc cat = concat [exactly d cat | d <- [1 ..]]
+  where
+    -- Trees of depth exactly d: the depth-bounded set minus shallower trees.
+    exactly d c = [tr | tr <- upTo d c, depth tr == d]
+
+    -- Trees of depth at most d. Children range over everything of depth
+    -- below d, so siblings of unequal depth are covered. A function with
+    -- arguments contributes nothing at d == 1 because 'combinations' is
+    -- empty as soon as one argument has no alternatives.
+    upTo 0 _ = []
+    upTo d c =
+      [ Tr (AC f) ts
+      | (f, Typ cs _) <- fns c
+      , ts <- combinations (map (upTo (d - 1)) cs)
+      ]
+
+    -- Functions listed for c in 'catfuns', paired with the type recorded in
+    -- 'funs'; names missing from 'funs' are silently skipped.
+    fns c =
+      let fs = lookMap [] c $ catfuns $ abstract gfcc
+      in [(f, ty) | f <- fs, Just (ty, _) <- [M.lookup f $ funs $ abstract gfcc]]
+
+    -- Leaves count as depth 1.
+    depth tr = case tr of
+      Tr _ [] -> 1
+      Tr _ ts -> maximum (map depth ts) + 1
+
+-- | Cartesian product of a list of alternatives (originally from Operations):
+-- every way of choosing one element from each inner list, in order.
+-- The empty outer list yields the single empty choice; any empty inner list
+-- yields no choices at all.
+combinations :: [[a]] -> [[a]]
+combinations = foldr pick [[]]
+  where
+    -- Prefix each choice for the remaining lists with each head alternative.
+    pick heads tails = [h : t | h <- heads, t <- tails]
+
+-- | Generate a list of random trees of category @cat@, driven by the
+-- random numbers drawn from @gen@.
+--
+-- Each attempt builds one tree; attempts whose node count exceeds @timeout@
+-- are dropped from the result. If every attempt is dropped, demanding an
+-- element of the result does not terminate.
+genRandom :: StdGen -> GFCC -> CId -> [Exp]
+genRandom gen gfcc cat = genTrees (randomRs (0.0, 1.0) gen) cat
+  where
+    -- Node budget per attempt; bigger trees are given up.
+    timeout = 47
+
+    -- Every attempt gets its own slice of timeout + 1 random numbers, so the
+    -- next attempt always starts from fresh numbers.
+    genTrees ds0 c =
+      let (ds, ds2) = splitAt (timeout + 1) ds0
+          (t, k) = genTree ds c
+          rest = genTrees ds2 c
+      in if k > timeout then rest else t : rest
+
+    -- Build one tree. The second component is the number of nodes in the
+    -- tree; it is also how far to advance in the list of random numbers.
+    genTree rs c = gett rs c
+      where
+        -- Literal categories get fixed dummy values.
+        gett _ (CId "String") = (Tr (AS "foo") [], 1)
+        gett _ (CId "Int") = (Tr (AI 12345) [], 1)
+        -- Random numbers for this attempt are used up.
+        gett [] _ = (Tr (AS "TIMEOUT") [], 1)
+        gett (d : ds2) k = case fns k of
+          -- No function is available for this category.
+          [] -> (Tr (AM 0) [], 1)
+          fs ->
+            let (f, args) = getf d fs
+                (ts, n) = getts ds2 args
+            in (Tr (AC f) ts, n + 1)
+
+        -- Scale d from [0,1] to an index into fs. The interval is closed, so
+        -- d may be exactly 1.0; clamp to the last element instead of letting
+        -- (!!) run off the end. fs is non-empty at the only call site.
+        getf d fs =
+          let lg = length fs
+          in fs !! min (lg - 1) (floor (d * fromIntegral lg))
+
+        -- Generate the argument trees left to right, each one starting after
+        -- the numbers accounted for by its preceding siblings.
+        getts ds ks = case ks of
+          k : more ->
+            let (t, n) = gett ds k
+                (ts, ns) = getts (drop n ds) more
+            in (t : ts, n + ns)
+          [] -> ([], 0)
+
+    -- Functions listed for c in 'catfuns', paired with the argument
+    -- categories of the type recorded in 'funs'; unknown names are skipped.
+    fns c =
+      [ (f, cs)
+      | f <- M.findWithDefault [] c (catfuns (abstract gfcc))
+      , Just (Typ cs _, _) <- [M.lookup f (funs (abstract gfcc))]
+      ]
+
+-- | Brute-force parsing: linearize the first @i@ trees produced by
+-- 'generate' in every concrete syntax named by 'cncnames', and keep the trees
+-- whose linearization splits into exactly the words @ws@. A tree appears once
+-- for each language in which it matches. The list is lazy, so a caller that
+-- needs a single parse can take its head.
+--
+-- Note: rules with unknown words cannot be thrown away from the grammar
+-- beforehand, because it is not known which field in each rule may match
+-- the input.
+searchParse :: Int -> GFCC -> CId -> [String] -> [Exp]
+searchParse i gfcc cat ws = concatMap hits candidates
+  where
+    candidates = take i (generate gfcc cat)
+    -- One copy of the tree per concrete syntax whose output matches ws.
+    hits t = [t | lang <- cncnames gfcc, words (linearize gfcc lang t) == ws]