-- path: root/src/GF/UseGrammar/Generate.hs
-- blob: 9f8fb66d1e9705e0f84c44f7cdbf0784f12391a9 (plain)
module Generate where

import GFC
import LookAbs
import PrGrammar
import Macros

import Operations
import List

-- Generate all trees of given category and depth. AR 30/4/2004
-- (c) Aarne Ranta 2004 under GNU GPL
--
-- Purpose: to generate corpora. We use simple types and don't
-- guarantee the correctness of bindings/dependences.


-- The main function: takes an abstract syntax and returns a list of trees.
-- The grammar is first simplified with gr2sgr, the trees are enumerated by
-- generate, and every result is translated back with str2tr.
-- Only the second component of cat is used; printing it with prt gives the
-- category name that generate filters on. n and mn are handed to generate
-- unchanged (tree depth and optional limit on subtrees per branch).

-- generateTrees :: GFCGrammar -> Cat -> Int -> Maybe Int -> [Exp]
generateTrees gr cat n mn =
  [str2tr tree | tree <- generate (gr2sgr gr) (prt (snd cat)) n mn]

------------------------------------------
-- translate grammar to simpler form and generated trees back

-- Translate a grammar into the simplified rule list used by generate.
-- Every function rule whose type has a category skeleton (catSkeleton
-- returns Ok) contributes exactly one simple rule; rules for which
-- catSkeleton does not return Ok are silently dropped.
gr2sgr :: GFCGrammar -> SGrammar
gr2sgr gr = concatMap simplify (funRulesOf gr) where
  -- the function name is the printed second component of the rule's key
  simplify (fun, typ) = case catSkeleton typ of
    Ok (argCats, valCat) -> [(prt (snd fun), (map catName argCats, catName valCat))]
    _ -> []
  -- only the second component of a category pair is kept; the first is ignored
  catName (_, c) = prt c

-- Translate a simplified tree back: the function name is turned into a
-- head expression with cn . zIdent and applied, via mkApp, to the
-- recursively translated subtrees.

-- str2tr :: STree -> Exp
str2tr (STr (fun, subtrees)) = mkApp headExp argExps where
  headExp = cn (zIdent fun)
  argExps = [str2tr sub | sub <- subtrees]

------------------------------------------
-- do the main thing with a simpler data structure
-- the first Int gives tree depth, the second constrains subtrees
-- chosen for each branch. A small number, such as 2, is a good choice
-- if the depth is large (more than 3)
--
-- Trees are built bottom-up in i rounds. Each round applies every rule of
-- the grammar to the trees collected so far and adds the results to the
-- collection; finally only the trees of the requested category are kept.
-- A depth of zero or less yields no trees. The result contains no
-- duplicate trees.


generate :: SGrammar -> SCat -> Int -> Maybe Int -> [STree]
generate gr cat i mn = [t | (c,t) <- gen 0 [], c == cat] where

  -- gen n cts: cts holds the (category, tree) pairs found after n rounds.
  gen :: Int -> [(SCat,STree)] -> [(SCat,STree)]
  gen n cts
    -- '>=' rather than '==' so that a negative depth terminates at once
    | n >= i    = cts
    -- nub must cover the old trees as well: every round re-derives the
    -- trees of the previous rounds, so deduplicating only the new ones
    -- would leave repeated entries in the collection
    | otherwise = gen (n+1) (nub (grown ++ cts))
    where
      grown = [(c, STr (f, xs)) | (f,(cs,c)) <- gr, xs <- args cs cts]

  -- All argument lists for a rule with argument categories cs: for each
  -- category the candidate trees are looked up in cts (limited by constr)
  -- and then combined by combinations (presumably the cartesian product of
  -- the candidate lists -- confirm in Operations).
  args :: [SCat] -> [(SCat,STree)] -> [[STree]]
  args cs cts = combinations [constr [t | (k,t) <- cts, k == c] | c <- cs]

  -- with mn = Just m keep at most m candidates per argument; otherwise all
  constr = maybe id take mn

-- Simplified grammar representation: every name is a plain string.
type SIdent = String

-- category names and function names
type SCat = SIdent
type SFun = SIdent

-- a simple type: the argument categories and the value category
type SType = ([SCat],SCat)

-- a rule pairs a function name with its simple type
type SRule = (SFun,SType)

-- a grammar is a list of rules
type SGrammar = [SRule]

-- a tree is a function name applied to a list of subtrees
newtype STree = STr (SFun,[STree]) deriving (Show,Eq)

------------------------------------------
-- to test

-- Print a tree as its function name followed by its arguments, each
-- preceded by one space. An argument that has subtrees of its own is
-- passed through prParenth (presumably adds parentheses -- see
-- Operations); an argument without subtrees is printed bare.
prSTree :: STree -> String
prSTree (STr (fun, subtrees)) = fun ++ concatMap showArg subtrees where
  showArg leaf@(STr (_, [])) = ' ' : prSTree leaf
  showArg inner              = ' ' : prParenth (prSTree inner)

-- Parse a rule written as "f : A -> B -> C" into (f, ([A,B], C)).
-- The string is split on whitespace. The first word is the function name,
-- the second word is skipped without being inspected, and of the remaining
-- words every other one (the 1st, 3rd, ...) is taken as a category; the
-- words in between are skipped without being inspected. The last category
-- is the value category, the ones before it are the argument categories.
-- A string with no category after the second word is rejected with the
-- "not a rule" error rather than failing inside init/last.
pSRule :: String -> SRule
pSRule s = case words s of
    f : _ : cs@(_ : _) -> (f, (init cats, last cats))
      -- cats is non-empty because cs is, so init and last are safe here
      where cats = everyOther cs
    _ -> error $ "not a rule" +++ s
  where
    -- keep the elements at positions 0, 2, 4, ... in a single pass
    everyOther (c : _ : rest) = c : everyOther rest
    everyOther rest           = take 1 rest

-- A small example grammar for testing, obtained by parsing each rule
-- string below with pSRule.
exSgr :: SGrammar
exSgr = [pSRule ruleText | ruleText <- ruleTexts] where
  ruleTexts =
    [ "Pred   : NP -> VP -> S"
    , "Compl  : TV -> NP -> VP"
    , "PredVV : VV -> VP -> VP"
    , "DefCN  : CN -> NP"
    , "ModCN  : AP -> CN -> CN"
    , "john   : NP"
    , "walk   : VP"
    , "love   : TV"
    , "try    : VV"
    , "girl   : CN"
    , "big    : AP"
    ]