summaryrefslogtreecommitdiff
path: root/src/compiler/GF/Command
diff options
context:
space:
mode:
Diffstat (limited to 'src/compiler/GF/Command')
-rw-r--r--src/compiler/GF/Command/Commands2.hs1425
1 files changed, 1425 insertions, 0 deletions
diff --git a/src/compiler/GF/Command/Commands2.hs b/src/compiler/GF/Command/Commands2.hs
new file mode 100644
index 000000000..0c9315f1d
--- /dev/null
+++ b/src/compiler/GF/Command/Commands2.hs
@@ -0,0 +1,1425 @@
+{-# LANGUAGE PatternGuards, TypeSynonymInstances, FlexibleInstances #-}
+module GF.Command.Commands2 (
+ PGFEnv,pgfEnv,emptyPGFEnv,allCommands,
+ options, flags,
+ ) where
+import Prelude hiding (putStrLn)
+
+import qualified PGF2 as C
+import qualified PGF as H
+
+--import qualified PGF.Internal as H(lookStartCat,functionsToCat,lookValCat,restrictPGF,hasLin)
+--import qualified PGF.Internal as H(abstract,funs,cats,Expr(EFun)) ----
+--import qualified PGF.Internal as H(Literal(LStr),Expr(ELit)) ----
+--import qualified PGF.Internal as H(ppFun,ppCat)
+
+--import qualified PGF.Internal as H(optimizePGF)
+
+--import GF.Compile.Export
+--import GF.Compile.ToAPI
+--import GF.Compile.ExampleBased
+--import GF.Infra.Option (noOptions, readOutputFormat, outputFormatsExpl)
+import GF.Infra.UseIO(writeUTF8File)
+import GF.Infra.SIO
+--import GF.Data.ErrM ----
+import GF.Command.Abstract
+--import GF.Command.Messages
+import GF.Command.CommandInfo
+import GF.Command.Help
+import GF.Text.Lexing
+--import GF.Text.Clitics
+import GF.Text.Transliterations
+--import GF.Quiz
+
+--import GF.Command.TreeOperations ---- temporary place for typecheck and compute
+
+import GF.Data.Operations
+
+--import PGF.Internal (encodeFile)
+--import Data.List(intersperse,nub)
+import Data.Maybe
+import qualified Data.Map as Map
+--import System.Cmd(system) -- use GF.Infra.UseIO.restricedSystem instead!
+import GF.System.Process
+import GF.Text.Pretty
+import Data.List (sort)
+import Control.Monad(mplus)
+--import Debug.Trace
+--import System.Random (newStdGen) ----
+
+
+type PGFEnv = (Maybe C.PGF, Map.Map C.ConcName C.Concr)
+
+pgfEnv pgf = (Just pgf,C.languages pgf) :: PGFEnv
+emptyPGFEnv = (Nothing,Map.empty) :: PGFEnv
+
+instance TypeCheckArg PGFEnv where
+ typeCheckArg env e = Right e -- no type checker available !!
+
+
+-- this list must no more be kept sorted by the command name
+allCommands :: Map.Map String (CommandInfo PGFEnv)
+allCommands = Map.fromList [
+ ("!", emptyCommandInfo {
+ synopsis = "system command: escape to system shell",
+ syntax = "! SYSTEMCOMMAND",
+ examples = [
+ ("! ls *.gf", "list all GF files in the working directory")
+ ],
+ needsTypeCheck = False
+ }),
+ ("?", emptyCommandInfo {
+ synopsis = "system pipe: send value from previous command to a system command",
+ syntax = "? SYSTEMCOMMAND",
+ examples = [
+ ("gt | l | ? wc", "generate, linearize, word-count")
+ ],
+ needsTypeCheck = False
+ }),
+{-
+ ("aw", emptyCommandInfo {
+ longname = "align_words",
+ synopsis = "show word alignments between languages graphically",
+ explanation = unlines [
+ "Prints a set of strings in the .dot format (the graphviz format).",
+ "The graph can be saved in a file by the wf command as usual.",
+ "If the -view flag is defined, the graph is saved in a temporary file",
+ "which is processed by graphviz and displayed by the program indicated",
+ "by the flag. The target format is postscript, unless overridden by the",
+ "flag -format."
+ ],
+ exec = \env@(pgf, mos) opts es -> do
+ let langs = optLangs pgf opts
+ if isOpt "giza" opts
+ then do
+ let giz = map (H.gizaAlignment pgf (head $ langs, head $ tail $ langs)) es
+ let lsrc = unlines $ map (\(x,_,_) -> x) giz
+ let ltrg = unlines $ map (\(_,x,_) -> x) giz
+ let align = unlines $ map (\(_,_,x) -> x) giz
+ let grph = if null es then [] else lsrc ++ "\n--end_source--\n\n"++ltrg++"\n-end_target--\n\n"++align
+ return $ fromString grph
+ else do
+ let grph = if null es then [] else H.graphvizAlignment pgf langs (head es)
+ if isFlag "view" opts || isFlag "format" opts
+ then do
+ let file s = "_grph." ++ s
+ let view = optViewGraph opts
+ let format = optViewFormat opts
+ restricted $ writeUTF8File (file "dot") grph
+ restrictedSystem $ "dot -T" ++ format ++ " " ++ file "dot" ++ " > " ++ file format
+ restrictedSystem $ view ++ " " ++ file format
+ return void
+ else return $ fromString grph,
+ examples = [
+ ("gr | aw" , "generate a tree and show word alignment as graph script"),
+ ("gr | aw -view=\"open\"" , "generate a tree and display alignment on Mac"),
+ ("gr | aw -view=\"eog\"" , "generate a tree and display alignment on Ubuntu"),
+ ("gt | aw -giza | wf -file=aligns" , "generate trees, send giza alignments to file")
+ ],
+ options = [
+ ("giza", "show alignments in the Giza format; the first two languages")
+ ],
+ flags = [
+ ("format","format of the visualization file (default \"png\")"),
+ ("lang", "alignments for this list of languages (default: all)"),
+ ("view", "program to open the resulting file")
+ ]
+ }),
+
+ ("ca", emptyCommandInfo {
+ longname = "clitic_analyse",
+ synopsis = "print the analyses of all words into stems and clitics",
+ explanation = unlines [
+ "Analyses all words into all possible combinations of stem + clitics.",
+ "The analysis is returned in the format stem &+ clitic1 &+ clitic2 ...",
+ "which is hence the inverse of 'pt -bind'. The list of clitics is give",
+ "by the flag '-clitics'. The list of stems is given as the list of words",
+ "of the language given by the '-lang' flag."
+ ],
+ exec = \env opts -> case opts of
+ _ | isOpt "raw" opts ->
+ return . fromString .
+ unlines . map (unwords . map (concat . intersperse "+")) .
+ map (getClitics (H.isInMorpho (optMorpho env opts)) (optClitics opts)) .
+ concatMap words . toStrings
+ _ ->
+ return . fromStrings .
+ getCliticsText (H.isInMorpho (optMorpho env opts)) (optClitics opts) .
+ concatMap words . toStrings,
+ flags = [
+ ("clitics","the list of possible clitics (comma-separated, no spaces)"),
+ ("lang", "the language of analysis")
+ ],
+ options = [
+ ("raw", "analyse each word separately (not suitable input for parser)")
+ ],
+ examples = [
+ mkEx "ca -lang=Fin -clitics=ko,ni \"nukkuuko minun vaimoni\" | p -- to parse Finnish"
+ ]
+ }),
+
+ ("cc", emptyCommandInfo {
+ longname = "compute_concrete",
+ syntax = "cc (-all | -table | -unqual)? TERM",
+ synopsis = "computes concrete syntax term using a source grammar",
+ explanation = unlines [
+ "Compute TERM by concrete syntax definitions. Uses the topmost",
+ "module (the last one imported) to resolve constant names.",
+ "N.B.1 You need the flag -retain when importing the grammar, if you want",
+ "the definitions to be retained after compilation.",
+ "N.B.2 The resulting term is not a tree in the sense of abstract syntax",
+ "and hence not a valid input to a Tree-expecting command.",
+ "This command must be a line of its own, and thus cannot be a part",
+ "of a pipe."
+ ],
+ options = [
+ ("all","pick all strings (forms and variants) from records and tables"),
+ ("list","all strings, comma-separated on one line"),
+ ("one","pick the first strings, if there is any, from records and tables"),
+ ("table","show all strings labelled by parameters"),
+ ("unqual","hide qualifying module names")
+ ],
+ needsTypeCheck = False
+ }),
+-}
+ ("dc", emptyCommandInfo {
+ longname = "define_command",
+ syntax = "dc IDENT COMMANDLINE",
+ synopsis = "define a command macro",
+ explanation = unlines [
+ "Defines IDENT as macro for COMMANDLINE, until IDENT gets redefined.",
+ "A call of the command has the form %IDENT. The command may take an",
+ "argument, which in COMMANDLINE is marked as ?0. Both strings and",
+ "trees can be arguments. Currently at most one argument is possible.",
+ "This command must be a line of its own, and thus cannot be a part",
+ "of a pipe."
+ ],
+ needsTypeCheck = False
+ }),
+{-
+ ("dg", emptyCommandInfo {
+ longname = "dependency_graph",
+ syntax = "dg (-only=MODULES)?",
+ synopsis = "print module dependency graph",
+ explanation = unlines [
+ "Prints the dependency graph of source modules.",
+ "Requires that import has been done with the -retain flag.",
+ "The graph is written in the file _gfdepgraph.dot",
+ "which can be further processed by Graphviz (the system command 'dot').",
+ "By default, all modules are shown, but the -only flag restricts them",
+ "by a comma-separated list of patterns, where 'name*' matches modules",
+ "whose name has prefix 'name', and other patterns match modules with",
+ "exactly the same name. The graphical conventions are:",
+ " solid box = abstract, solid ellipse = concrete, dashed ellipse = other",
+ " solid arrow empty head = of, solid arrow = **, dashed arrow = open",
+ " dotted arrow = other dependency"
+ ],
+ flags = [
+ ("only","list of modules included (default: all), literally or by prefix*")
+ ],
+ examples = [
+ mkEx "dg -only=SyntaxEng,Food* -- shows only SyntaxEng, and those with prefix Food"
+ ],
+ needsTypeCheck = False
+ }),
+-}
+ ("dt", emptyCommandInfo {
+ longname = "define_tree",
+ syntax = "dt IDENT (TREE | STRING | \"<\" COMMANDLINE)",
+ synopsis = "define a tree or string macro",
+ explanation = unlines [
+ "Defines IDENT as macro for TREE or STRING, until IDENT gets redefined.",
+ "The defining value can also come from a command, preceded by \"<\".",
+ "If the command gives many values, the first one is selected.",
+ "A use of the macro has the form %IDENT. Currently this use cannot be",
+ "a subtree of another tree. This command must be a line of its own",
+ "and thus cannot be a part of a pipe."
+ ],
+ examples = [
+ mkEx ("dt ex \"hello world\" -- define ex as string"),
+ mkEx ("dt ex UseN man_N -- define ex as string"),
+ mkEx ("dt ex < p -cat=NP \"the man in the car\" -- define ex as parse result"),
+ mkEx ("l -lang=LangSwe %ex | ps -to_utf8 -- linearize the tree ex")
+ ],
+ needsTypeCheck = False
+ }),
+ ("e", emptyCommandInfo {
+ longname = "empty",
+ synopsis = "empty the environment"
+ }),
+{-
+ ("eb", emptyCommandInfo {
+ longname = "example_based",
+ syntax = "eb (-probs=FILE | -lang=LANG)* -file=FILE.gfe",
+ synopsis = "converts .gfe files to .gf files by parsing examples to trees",
+ explanation = unlines [
+ "Reads FILE.gfe and writes FILE.gf. Each expression of form",
+ "'%ex CAT QUOTEDSTRING' in FILE.gfe is replaced by a syntax tree.",
+ "This tree is the first one returned by the parser; a biased ranking",
+ "can be used to regulate the order. If there are more than one parses",
+ "the rest are shown in comments, with probabilities if the order is biased.",
+ "The probabilities flag and configuration file is similar to the commands",
+ "gr and rt. Notice that the command doesn't change the environment,",
+ "but the resulting .gf file must be imported separately."
+ ],
+ options = [
+ ("api","convert trees to overloaded API expressions (using Syntax not Lang)")
+ ],
+ flags = [
+ ("file","the file to be converted (suffix .gfe must be given)"),
+ ("lang","the language in which to parse"),
+ ("probs","file with probabilities to rank the parses")
+ ],
+ exec = \env@(pgf, mos) opts _ -> do
+ let file = optFile opts
+ pgf <- optProbs opts pgf
+ let printer = if (isOpt "api" opts) then exprToAPI else (H.showExpr [])
+ let conf = configureExBased pgf (optMorpho env opts) (optLang pgf opts) printer
+ (file',ws) <- restricted $ parseExamplesInGrammar conf file
+ if null ws then return () else putStrLn ("unknown words: " ++ unwords ws)
+ return (fromString ("wrote " ++ file')),
+ needsTypeCheck = False
+ }),
+-}
+{-
+ ("gr", emptyCommandInfo {
+ longname = "generate_random",
+ synopsis = "generate random trees in the current abstract syntax",
+ syntax = "gr [-cat=CAT] [-number=INT]",
+ examples = [
+ mkEx "gr -- one tree in the startcat of the current grammar",
+ mkEx "gr -cat=NP -number=16 -- 16 trees in the category NP",
+ mkEx "gr -lang=LangHin,LangTha -cat=Cl -- Cl, both in LangHin and LangTha",
+ mkEx "gr -probs=FILE -- generate with bias",
+ mkEx "gr (AdjCN ? (UseN ?)) -- generate trees of form (AdjCN ? (UseN ?))"
+ ],
+ explanation = unlines [
+ "Generates a list of random trees, by default one tree.",
+ "If a tree argument is given, the command completes the Tree with values to",
+ "all metavariables in the tree. The generation can be biased by probabilities,",
+ "given in a file in the -probs flag."
+ ],
+ flags = [
+ ("cat","generation category"),
+ ("lang","uses only functions that have linearizations in all these languages"),
+ ("number","number of trees generated"),
+ ("depth","the maximum generation depth"),
+ ("probs", "file with biased probabilities (format 'f 0.4' one by line)")
+ ],
+ exec = \env@(pgf, mos) opts xs -> do
+ pgf <- optProbs opts (optRestricted opts pgf)
+ gen <- newStdGen
+ let dp = valIntOpts "depth" 4 opts
+ let ts = case mexp xs of
+ Just ex -> H.generateRandomFromDepth gen pgf ex (Just dp)
+ Nothing -> H.generateRandomDepth gen pgf (optType pgf opts) (Just dp)
+ returnFromExprs $ take (optNum opts) ts
+ }),
+-}
+ ("ga", emptyCommandInfo {
+ longname = "generate_all",
+ synopsis = "generate a list of all trees",
+ flags = [("cat","the generation category"),
+ ("number","the number of trees generated")],
+ examples = [
+ mkEx "ga -- all trees in the startcat",
+ mkEx "ga -cat=NP -number=16 -- 16 trees in the category NP"],
+ exec = needPGF $ \ env@(pgf,_) opts _ ->
+ let ts = map fst (C.generateAll pgf cat)
+ cat = optCat pgf opts
+ in returnFromCExprs (takeOptNum opts ts),
+ needsTypeCheck = False
+ }),
+{-
+ ("gt", emptyCommandInfo {
+ longname = "generate_trees",
+ synopsis = "generates a list of trees, by default exhaustive",
+ explanation = unlines [
+ "Generates all trees of a given category. By default, ",
+ "the depth is limited to 4, but this can be changed by a flag.",
+ "If a Tree argument is given, the command completes the Tree with values",
+ "to all metavariables in the tree."
+ ],
+ flags = [
+ ("cat","the generation category"),
+ ("depth","the maximum generation depth"),
+ ("lang","excludes functions that have no linearization in this language"),
+ ("number","the number of trees generated")
+ ],
+ examples = [
+ mkEx "gt -- all trees in the startcat, to depth 4",
+ mkEx "gt -cat=NP -number=16 -- 16 trees in the category NP",
+ mkEx "gt -cat=NP -depth=2 -- trees in the category NP to depth 2",
+ mkEx "gt (AdjCN ? (UseN ?)) -- trees of form (AdjCN ? (UseN ?))"
+ ],
+ exec = \env@(pgf, mos) opts xs -> do
+ let pgfr = optRestricted opts pgf
+ let dp = valIntOpts "depth" 4 opts
+ let ts = case mexp xs of
+ Just ex -> H.generateFromDepth pgfr ex (Just dp)
+ Nothing -> H.generateAllDepth pgfr (optType pgf opts) (Just dp)
+ returnFromExprs $ take (optNumInf opts) ts
+ }),
+-}
+ helpCommand allCommands,
+ ("i", emptyCommandInfo {
+ longname = "import",
+ synopsis = "import a grammar from source code or compiled .pgf file",
+ explanation = unlines [
+ "Reads a grammar from File and compiles it into a GF runtime grammar.",
+ "If its abstract is different from current state, old modules are discarded.",
+ "If its abstract is the same and a concrete with the same name is already in the state",
+ "it is overwritten - but only if compilation succeeds.",
+ "The grammar parser depends on the file name suffix:",
+ " .cf context-free (labelled BNF) source",
+ " .ebnf extended BNF source",
+ " .gfm multi-module GF source",
+ " .gf normal GF source",
+ " .gfo compiled GF source",
+ " .pgf precompiled grammar in Portable Grammar Format"
+ ],
+ flags = [
+ ("probs","file with biased probabilities for generation")
+ ],
+ options = [
+ -- ["gfo", "src", "no-cpu", "cpu", "quiet", "verbose"]
+ ("retain","retain operations (used for cc command)"),
+ ("src", "force compilation from source"),
+ ("v", "be verbose - show intermediate status information")
+ ],
+ needsTypeCheck = False
+ }),
+ ("l", emptyCommandInfo {
+ longname = "linearize",
+ synopsis = "convert an abstract syntax expression to string",
+ explanation = unlines [
+ "Shows the linearization of a Tree by the grammars in scope.",
+ "The -lang flag can be used to restrict this to fewer languages."],
+ flags = [
+ ("lang","the languages of linearization (comma-separated, no spaces)")
+ ],
+ examples = [
+ mkEx "l -lang=LangSwe,LangNor no_Utt -- linearize tree to LangSwe and LangNor"],
+ exec = needPGF $ \ env opts ->
+ return . fromStrings . cLins env opts . map cExpr
+ }),
+{-
+ ("l", emptyCommandInfo {
+ longname = "linearize",
+ synopsis = "convert an abstract syntax expression to string",
+ explanation = unlines [
+ "Shows the linearization of a Tree by the grammars in scope.",
+ "The -lang flag can be used to restrict this to fewer languages.",
+ "A sequence of string operations (see command ps) can be given",
+ "as options, and works then like a pipe to the ps command, except",
+ "that it only affect the strings, not e.g. the table labels.",
+ "These can be given separately to each language with the unlexer flag",
+ "whose results are prepended to the other lexer flags. The value of the",
+ "unlexer flag is a space-separated list of comma-separated string operation",
+ "sequences; see example."
+ ],
+ examples = [
+ mkEx "l -lang=LangSwe,LangNor no_Utt -- linearize tree to LangSwe and LangNor",
+ mkEx "gr -lang=LangHin -cat=Cl | l -table -to_devanagari -- hindi table",
+ mkEx "l -unlexer=\"LangAra=to_arabic LangHin=to_devanagari\" -- different unlexers"
+ ],
+ exec = \env@(pgf, mos) opts -> return . fromStrings . optLins pgf opts,
+ options = [
+ ("all", "show all forms and variants, one by line (cf. l -list)"),
+ ("bracket","show tree structure with brackets and paths to nodes"),
+ ("groups", "all languages, grouped by lang, remove duplicate strings"),
+ ("list","show all forms and variants, comma-separated on one line (cf. l -all)"),
+ ("multi","linearize to all languages (default)"),
+ ("table","show all forms labelled by parameters"),
+ ("treebank","show the tree and tag linearizations with language names")
+ ] ++ stringOpOptions,
+ flags = [
+ ("lang","the languages of linearization (comma-separated, no spaces)"),
+ ("unlexer","set unlexers separately to each language (space-separated)")
+ ]
+ }),
+-}
+{-
+ ("lc", emptyCommandInfo {
+ longname = "linearize_chunks",
+ synopsis = "linearize a tree that has metavariables in maximal chunks without them",
+ explanation = unlines [
+ "A hopefully temporary command, intended to work around the type checker that fails",
+ "trees where a function node is a metavariable."
+ ],
+ examples = [
+ mkEx "l -lang=LangSwe,LangNor -chunks ? a b (? c d)"
+ ],
+ exec = \env@(pgf, mos) opts -> return . fromStrings . optLins pgf (opts ++ [OOpt "chunks"]),
+ options = [
+ ("treebank","show the tree and tag linearizations with language names")
+ ] ++ stringOpOptions,
+ flags = [
+ ("lang","the languages of linearization (comma-separated, no spaces)")
+ ],
+ needsTypeCheck = False
+ }),
+-}
+{-
+ ("ma", emptyCommandInfo {
+ longname = "morpho_analyse",
+ synopsis = "print the morphological analyses of all words in the string",
+ explanation = unlines [
+ "Prints all the analyses of space-separated words in the input string,",
+ "using the morphological analyser of the actual grammar (see command pg)"
+ ],
+ exec = \env opts -> case opts of
+ _ | isOpt "missing" opts ->
+ return . fromString . unwords .
+ H.morphoMissing (optMorpho env opts) .
+ concatMap words . toStrings
+ _ | isOpt "known" opts ->
+ return . fromString . unwords .
+ H.morphoKnown (optMorpho env opts) .
+ concatMap words . toStrings
+ _ -> return . fromString . unlines .
+ map prMorphoAnalysis . concatMap (morphos env opts) .
+ concatMap words . toStrings ,
+ flags = [
+ ("lang","the languages of analysis (comma-separated, no spaces)")
+ ],
+ options = [
+ ("known", "return only the known words, in order of appearance"),
+ ("missing","show the list of unknown words, in order of appearance")
+ ]
+ }),
+ ("mq", emptyCommandInfo {
+ longname = "morpho_quiz",
+ synopsis = "start a morphology quiz",
+ syntax = "mq (-cat=CAT)? (-probs=FILE)? TREE?",
+ exec = \env@(pgf, mos) opts xs -> do
+ let lang = optLang pgf opts
+ let typ = optType pgf opts
+ pgf <- optProbs opts pgf
+ let mt = mexp xs
+ restricted $ morphologyQuiz mt pgf lang typ
+ return void,
+ flags = [
+ ("lang","language of the quiz"),
+ ("cat","category of the quiz"),
+ ("number","maximum number of questions"),
+ ("probs","file with biased probabilities for generation")
+ ]
+ }),
+-}
+ ("p", emptyCommandInfo {
+ longname = "parse",
+ synopsis = "parse a string to abstract syntax expression",
+ explanation = unlines [
+ "Shows all trees returned by parsing a string in the grammars in scope.",
+ "The -lang flag can be used to restrict this to fewer languages.",
+ "The default start category can be overridden by the -cat flag.",
+ "See also the ps command for lexing and character encoding."
+ ],
+ flags = [
+ ("cat","target category of parsing"),
+ ("lang","the languages of parsing (comma-separated, no spaces)"),
+ ("number","maximum number of trees returned")
+ ],
+ examples = [
+ mkEx "p \"this fish is fresh\" | l -lang=Swe -- try parsing with all languages and translate the successful parses to Swedish"
+ ],
+ exec = needPGF $ \ env opts -> return . cParse env opts . toStrings
+ }),
+{-
+ ("p", emptyCommandInfo {
+ longname = "parse",
+ synopsis = "parse a string to abstract syntax expression",
+ explanation = unlines [
+ "Shows all trees returned by parsing a string in the grammars in scope.",
+ "The -lang flag can be used to restrict this to fewer languages.",
+ "The default start category can be overridden by the -cat flag.",
+ "See also the ps command for lexing and character encoding.",
+ "",
+ "The -openclass flag is experimental and allows some robustness in ",
+ "the parser. For example if -openclass=\"A,N,V\" is given, the parser",
+ "will accept unknown adjectives, nouns and verbs with the resource grammar."
+ ],
+ exec = \env@(pgf, mos) opts ts ->
+ return . Piped $ fromParse opts (concat [map ((,) s) (par pgf opts s) | s <- toStrings ts]),
+ flags = [
+ ("cat","target category of parsing"),
+ ("lang","the languages of parsing (comma-separated, no spaces)"),
+ ("openclass","list of open-class categories for robust parsing"),
+ ("depth","maximal depth for proof search if the abstract syntax tree has meta variables")
+ ],
+ options = [
+ ("bracket","prints the bracketed string from the parser")
+ ]
+ }),
+-}
+{-
+ ("pg", emptyCommandInfo { -----
+ longname = "print_grammar",
+ synopsis = "print the actual grammar with the given printer",
+ explanation = unlines [
+ "Prints the actual grammar, with all involved languages.",
+ "In some printers, this can be restricted to a subset of languages",
+ "with the -lang=X,Y flag (comma-separated, no spaces).",
+ "The -printer=P flag sets the format in which the grammar is printed.",
+ "N.B.1 Since grammars are compiled when imported, this command",
+ "generally shows a grammar that looks rather different from the source.",
+ "N.B.2 Another way to produce different formats is to use 'gf -make',",
+ "the batch compiler. The following values are available both for",
+ "the batch compiler (flag -output-format) and the print_grammar",
+ "command (flag -printer):",
+ ""
+ ] ++ unlines (sort [
+ " " ++ opt ++ "\t\t" ++ expl |
+ ((opt,_),expl) <- outputFormatsExpl, take 1 expl /= "*"
+ ]),
+ exec = \env opts _ -> prGrammar env opts,
+ flags = [
+ --"cat",
+ ("file", "set the file name when printing with -pgf option"),
+ ("lang", "select languages for the some options (default all languages)"),
+ ("printer","select the printing format (see flag values above)")
+ ],
+ options = [
+ ("cats", "show just the names of abstract syntax categories"),
+ ("fullform", "print the fullform lexicon"),
+ ("funs", "show just the names and types of abstract syntax functions"),
+ ("langs", "show just the names of top concrete syntax modules"),
+ ("lexc", "print the lexicon in Xerox LEXC format"),
+ ("missing","show just the names of functions that have no linearization"),
+ ("opt", "optimize the generated pgf"),
+ ("pgf", "write current pgf image in file"),
+ ("words", "print the list of words")
+ ],
+ examples = [
+ mkEx ("pg -funs | ? grep \" S ;\" -- show functions with value cat S")
+ ]
+ }),
+-}
+ ("ph", emptyCommandInfo {
+ longname = "print_history",
+ synopsis = "print command history",
+ explanation = unlines [
+ "Prints the commands issued during the GF session.",
+ "The result is readable by the eh command.",
+ "The result can be used as a script when starting GF."
+ ],
+ examples = [
+ mkEx "ph | wf -file=foo.gfs -- save the history into a file"
+ ]
+ }),
+ ("ps", emptyCommandInfo {
+ longname = "put_string",
+ syntax = "ps OPT? STRING",
+ synopsis = "return a string, possibly processed with a function",
+ explanation = unlines [
+ "Returns a string obtained from its argument string by applying",
+ "string processing functions in the order given in the command line",
+ "option list. Thus 'ps -f -g s' returns g (f s). Typical string processors",
+ "are lexers and unlexers, but also character encoding conversions are possible.",
+ "The unlexers preserve the division of their input to lines.",
+ "To see transliteration tables, use command ut."
+ ],
+ examples = [
+ mkEx "l (EAdd 3 4) | ps -code -- linearize code-like output",
+ mkEx "ps -lexer=code | p -cat=Exp -- parse code-like input",
+ mkEx "gr -cat=QCl | l | ps -bind -- linearization output from LangFin",
+ mkEx "ps -to_devanagari \"A-p\" -- show Devanagari in UTF8 terminal",
+ mkEx "rf -file=Hin.gf | ps -env=quotes -to_devanagari -- convert translit to UTF8",
+ mkEx "rf -file=Ara.gf | ps -from_utf8 -env=quotes -from_arabic -- convert UTF8 to transliteration",
+ mkEx "ps -to=chinese.trans \"abc\" -- apply transliteration defined in file chinese.trans"
+ ],
+ exec = \_ opts x -> do
+ let (os,fs) = optsAndFlags opts
+ trans <- optTranslit opts
+
+ if isOpt "lines" opts
+ then return $ fromStrings $ map (trans . stringOps (envFlag fs) (map prOpt os)) $ toStrings x
+ else return ((fromString . trans . stringOps (envFlag fs) (map prOpt os) . toString) x),
+ options = [
+ ("lines","apply the operation separately to each input line, returning a list of lines")
+ ] ++
+ stringOpOptions,
+ flags = [
+ ("env","apply in this environment only"),
+ ("from","backward-apply transliteration defined in this file (format 'unicode translit' per line)"),
+ ("to", "forward-apply transliteration defined in this file")
+ ]
+ }),
+ ("tt", emptyCommandInfo {
+ longname = "to_trie",
+ syntax = "to_trie",
+ synopsis = "combine a list of trees into a trie",
+ exec = \ _ _ -> return . fromString . trie
+ }),
+{-
+ ("pt", emptyCommandInfo {
+ longname = "put_tree",
+ syntax = "pt OPT? TREE",
+ synopsis = "return a tree, possibly processed with a function",
+ explanation = unlines [
+ "Returns a tree obtained from its argument tree by applying",
+ "tree processing functions in the order given in the command line",
+ "option list. Thus 'pt -f -g s' returns g (f s). Typical tree processors",
+ "are type checking and semantic computation."
+ ],
+ examples = [
+ mkEx "pt -compute (plus one two) -- compute value",
+ mkEx "p \"4 dogs love 5 cats\" | pt -transfer=digits2numeral | l -- four...five..."
+ ],
+ exec = \env@(pgf, mos) opts ->
+ returnFromExprs . takeOptNum opts . treeOps pgf opts,
+ options = treeOpOptions undefined{-pgf-},
+ flags = [("number","take at most this many trees")] ++ treeOpFlags undefined{-pgf-}
+ }),
+-}
+ ("q", emptyCommandInfo {
+ longname = "quit",
+ synopsis = "exit GF interpreter"
+ }),
+ ("r", emptyCommandInfo {
+ longname = "reload",
+ synopsis = "repeat the latest import command"
+ }),
+{-
+ ("rf", emptyCommandInfo {
+ longname = "read_file",
+ synopsis = "read string or tree input from a file",
+ explanation = unlines [
+ "Reads input from file. The filename must be in double quotes.",
+ "The input is interpreted as a string by default, and can hence be",
+ "piped e.g. to the parse command. The option -tree interprets the",
+ "input as a tree, which can be given e.g. to the linearize command.",
+ "The option -lines will result in a list of strings or trees, one by line."
+ ],
+ options = [
+ ("lines","return the list of lines, instead of the singleton of all contents"),
+ ("tree","convert strings into trees")
+ ],
+ exec = \env@(pgf, mos) opts _ -> do
+ let file = valStrOpts "file" "_gftmp" opts
+ let exprs [] = ([],empty)
+ exprs ((n,s):ls) | null s
+ = exprs ls
+ exprs ((n,s):ls) = case H.readExpr s of
+ Just e -> let (es,err) = exprs ls
+ in case H.inferExpr pgf e of
+ Right (e,t) -> (e:es,err)
+ Left tcerr -> (es,"on line" <+> n <> ':' $$ nest 2 (H.ppTcError tcerr) $$ err)
+ Nothing -> let (es,err) = exprs ls
+ in (es,"on line" <+> n <> ':' <+> "parse error" $$ err)
+ returnFromLines ls = case exprs ls of
+ (es, err) | null es -> return $ pipeMessage $ render (err $$ "no trees found")
+ | otherwise -> return $ pipeWithMessage es (render err)
+
+ s <- restricted $ readFile file
+ case opts of
+ _ | isOpt "lines" opts && isOpt "tree" opts ->
+ returnFromLines (zip [1::Int ..] (lines s))
+ _ | isOpt "tree" opts ->
+ returnFromLines [(1::Int,s)]
+ _ | isOpt "lines" opts -> return (fromStrings $ lines s)
+ _ -> return (fromString s),
+ flags = [("file","the input file name")]
+ }),
+
+ ("rt", emptyCommandInfo {
+ longname = "rank_trees",
+ synopsis = "show trees in an order of decreasing probability",
+ explanation = unlines [
+ "Order trees from the most to the least probable, using either",
+ "even distribution in each category (default) or biased as specified",
+ "by the file given by flag -probs=FILE, where each line has the form",
+ "'function probability', e.g. 'youPol_Pron 0.01'."
+ ],
+ exec = \env@(pgf, mos) opts ts -> do
+ pgf <- optProbs opts pgf
+ let tds = H.rankTreesByProbs pgf ts
+ if isOpt "v" opts
+ then putStrLn $
+ unlines [H.showExpr [] t ++ "\t--" ++ show d | (t,d) <- tds]
+ else return ()
+ returnFromExprs $ map fst tds,
+ flags = [
+ ("probs","probabilities from this file (format 'f 0.6' per line)")
+ ],
+ options = [
+ ("v","show all trees with their probability scores")
+ ],
+ examples = [
+ mkEx "p \"you are here\" | rt -probs=probs | pt -number=1 -- most probable result"
+ ]
+ }),
+
+ ("tq", emptyCommandInfo {
+ longname = "translation_quiz",
+ syntax = "tq -from=LANG -to=LANG (-cat=CAT)? (-probs=FILE)? TREE?",
+ synopsis = "start a translation quiz",
+ exec = \env@(pgf, mos) opts xs -> do
+ let from = optLangFlag "from" pgf opts
+ let to = optLangFlag "to" pgf opts
+ let typ = optType pgf opts
+ let mt = mexp xs
+ pgf <- optProbs opts pgf
+ restricted $ translationQuiz mt pgf from to typ
+ return void,
+ flags = [
+ ("from","translate from this language"),
+ ("to","translate to this language"),
+ ("cat","translate in this category"),
+ ("number","the maximum number of questions"),
+ ("probs","file with biased probabilities for generation")
+ ],
+ examples = [
+ mkEx ("tq -from=Eng -to=Swe -- any trees in startcat"),
+ mkEx ("tq -from=Eng -to=Swe (AdjCN (PositA ?2) (UseN ?)) -- only trees of this form")
+ ]
+ }),
+
+ ("sd", emptyCommandInfo {
+ longname = "show_dependencies",
+ syntax = "sd QUALIFIED_CONSTANT+",
+ synopsis = "show all constants that the given constants depend on",
+ explanation = unlines [
+ "Show recursively all qualified constant names, by tracing back the types and definitions",
+ "of each constant encountered, but just listing every name once.",
+ "This command requires a source grammar to be in scope, imported with 'import -retain'.",
+ "Notice that the accuracy is better if the modules are compiled with the flag -optimize=noexpand.",
+ "This command must be a line of its own, and thus cannot be a part of a pipe."
+ ],
+ options = [
+ ("size","show the size of the source code for each constants (number of constructors)")
+ ],
+ examples = [
+ mkEx "sd ParadigmsEng.mkV ParadigmsEng.mkN -- show all constants on which mkV and mkN depend",
+ mkEx "sd -size ParadigmsEng.mkV -- show all constants on which mkV depends, together with size"
+ ],
+ needsTypeCheck = False
+ }),
+-}
+ ("se", emptyCommandInfo {
+ longname = "set_encoding",
+ synopsis = "set the encoding used in current terminal",
+ syntax = "se ID",
+ examples = [
+ mkEx "se cp1251 -- set encoding to cp1521",
+ mkEx "se utf8 -- set encoding to utf8 (default)"
+ ],
+ needsTypeCheck = False
+ }),
+ ("sp", emptyCommandInfo {
+ longname = "system_pipe",
+ synopsis = "send argument to a system command",
+ syntax = "sp -command=\"SYSTEMCOMMAND\", alt. ? SYSTEMCOMMAND",
+ exec = \_ opts arg -> do
+ let syst = optComm opts -- ++ " " ++ tmpi
+ {-
+ let tmpi = "_tmpi" ---
+ let tmpo = "_tmpo"
+ restricted $ writeFile tmpi $ toString arg
+ restrictedSystem $ syst ++ " <" ++ tmpi ++ " >" ++ tmpo
+ fmap fromString $ restricted $ readFile tmpo,
+ -}
+ fmap fromString . restricted . readShellProcess syst $ toString arg,
+ flags = [
+ ("command","the system command applied to the argument")
+ ],
+ examples = [
+ mkEx "gt | l | ? wc -- generate trees, linearize, and count words"
+ ]
+ }),
+{-
+ ("so", emptyCommandInfo {
+ longname = "show_operations",
+ syntax = "so (-grep=STRING)* TYPE?",
+ synopsis = "show all operations in scope, possibly restricted to a value type",
+ explanation = unlines [
+ "Show the names and type signatures of all operations available in the current resource.",
+ "This command requires a source grammar to be in scope, imported with 'import -retain'.",
+ "The operations include the parameter constructors that are in scope.",
+ "The optional TYPE filters according to the value type.",
+ "The grep STRINGs filter according to other substrings of the type signatures.",
+ "This command must be a line of its own, and thus cannot be a part",
+ "of a pipe."
+ ],
+ flags = [
+ ("grep","substring used for filtering (the command can have many of these)")
+ ],
+ options = [
+ ("raw","show the types in computed forms (instead of category names)")
+ ],
+ needsTypeCheck = False
+ }),
+
+ ("ss", emptyCommandInfo {
+ longname = "show_source",
+ syntax = "ss (-strip)? (-save)? MODULE*",
+ synopsis = "show the source code of modules in scope, possibly just headers",
+ explanation = unlines [
+ "Show compiled source code, i.e. as it is included in GF object files.",
+ "This command requires a source grammar to be in scope, imported with 'import -retain'.",
+ "The optional MODULE arguments cause just these modules to be shown.",
+ "The -size and -detailedsize options show code size as the number of constructor nodes.",
+ "This command must be a line of its own, and thus cannot be a part of a pipe."
+ ],
+ options = [
+ ("detailedsize", "instead of code, show the sizes of all judgements and modules"),
+ ("save", "save each MODULE in file MODULE.gfh instead of printing it on terminal"),
+ ("size", "instead of code, show the sizes of all modules"),
+ ("strip","show only type signatures of oper's and lin's, not their definitions")
+ ],
+ examples = [
+ mkEx "ss -- print complete current source grammar on terminal",
+ mkEx "ss -strip -save MorphoFin -- print the headers in file MorphoFin.gfh"
+ ],
+ needsTypeCheck = False
+ }),
+-}
+ ("ut", emptyCommandInfo {
+ longname = "unicode_table",
+ synopsis = "show a transliteration table for a unicode character set",
+ exec = \_ opts _ -> do
+ let t = concatMap prOpt (take 1 opts)
+ let out = maybe "no such transliteration" characterTable $ transliteration t
+ return $ fromString out,
+ options = transliterationPrintNames
+ }),
+{-
+ ("vd", emptyCommandInfo {
+ longname = "visualize_dependency",
+ synopsis = "show word dependency tree graphically",
+ explanation = unlines [
+ "Prints a dependency tree in the .dot format (the graphviz format, default)",
+ "or the CoNLL/MaltParser format (flag -output=conll for training, malt_input",
+ "for unanalysed input).",
+ "By default, the last argument is the head of every abstract syntax",
+ "function; moreover, the head depends on the head of the function above.",
+ "The graph can be saved in a file by the wf command as usual.",
+ "If the -view flag is defined, the graph is saved in a temporary file",
+ "which is processed by graphviz and displayed by the program indicated",
+ "by the flag. The target format is png, unless overridden by the",
+ "flag -format."
+ ],
+ exec = \env@(pgf, mos) opts es -> do
+ let debug = isOpt "v" opts
+ let file = valStrOpts "file" "" opts
+ let outp = valStrOpts "output" "dot" opts
+ mlab <- case file of
+ "" -> return Nothing
+ _ -> (Just . H.getDepLabels . lines) `fmap` restricted (readFile file)
+ let lang = optLang pgf opts
+ let grphs = unlines $ map (H.graphvizDependencyTree outp debug mlab Nothing pgf lang) es
+ if isFlag "view" opts || isFlag "format" opts then do
+ let file s = "_grphd." ++ s
+ let view = optViewGraph opts
+ let format = optViewFormat opts
+ restricted $ writeUTF8File (file "dot") grphs
+ restrictedSystem $ "dot -T" ++ format ++ " " ++ file "dot" ++ " > " ++ file format
+ restrictedSystem $ view ++ " " ++ file format
+ return void
+ else return $ fromString grphs,
+ examples = [
+ mkEx "gr | vd -- generate a tree and show dependency tree in .dot",
+ mkEx "gr | vd -view=open -- generate a tree and display dependency tree on a Mac",
+ mkEx "gr -number=1000 | vd -file=dep.labels -output=malt -- generate training treebank",
+ mkEx "gr -number=100 | vd -file=dep.labels -output=malt_input -- generate test sentences"
+ ],
+ options = [
+ ("v","show extra information")
+ ],
+ flags = [
+ ("file","configuration file for labels per fun, format 'fun l1 ... label ... l2'"),
+ ("format","format of the visualization file (default \"png\")"),
+ ("output","output format of graph source (default \"dot\")"),
+ ("view","program to open the resulting file (default \"open\")"),
+ ("lang","the language of analysis")
+ ]
+ }),
+
+
+ ("vp", emptyCommandInfo {
+ longname = "visualize_parse",
+ synopsis = "show parse tree graphically",
+ explanation = unlines [
+ "Prints a parse tree in the .dot format (the graphviz format).",
+ "The graph can be saved in a file by the wf command as usual.",
+ "If the -view flag is defined, the graph is saved in a temporary file",
+ "which is processed by graphviz and displayed by the program indicated",
+ "by the flag. The target format is png, unless overridden by the",
+ "flag -format."
+ ],
+ exec = \env@(pgf, mos) opts es -> do
+ let lang = optLang pgf opts
+ let gvOptions=H.GraphvizOptions {H.noLeaves = isOpt "noleaves" opts && not (isOpt "showleaves" opts),
+ H.noFun = isOpt "nofun" opts || not (isOpt "showfun" opts),
+ H.noCat = isOpt "nocat" opts && not (isOpt "showcat" opts),
+ H.nodeFont = valStrOpts "nodefont" "" opts,
+ H.leafFont = valStrOpts "leaffont" "" opts,
+ H.nodeColor = valStrOpts "nodecolor" "" opts,
+ H.leafColor = valStrOpts "leafcolor" "" opts,
+ H.nodeEdgeStyle = valStrOpts "nodeedgestyle" "solid" opts,
+ H.leafEdgeStyle = valStrOpts "leafedgestyle" "dashed" opts
+ }
+ let grph = if null es
+ then []
+ else H.graphvizParseTree pgf lang gvOptions (head es)
+ if isFlag "view" opts || isFlag "format" opts then do
+ let file s = "_grph." ++ s
+ let view = optViewGraph opts
+ let format = optViewFormat opts
+ restricted $ writeUTF8File (file "dot") grph
+ restrictedSystem $ "dot -T" ++ format ++ " " ++ file "dot" ++ " > " ++ file format
+ restrictedSystem $ view ++ " " ++ file format
+ return void
+ else return $ fromString grph,
+ examples = [
+ mkEx "p \"John walks\" | vp -- generate a tree and show parse tree as .dot script",
+ mkEx "gr | vp -view=\"open\" -- generate a tree and display parse tree on a Mac"
+ ],
+ options = [
+ ("showcat","show categories in the tree nodes (default)"),
+ ("nocat","don't show categories"),
+ ("showfun","show function names in the tree nodes"),
+ ("nofun","don't show function names (default)"),
+ ("showleaves","show the leaves of the tree (default)"),
+ ("noleaves","don't show the leaves of the tree (i.e., only the abstract tree)")
+ ],
+ flags = [
+ ("format","format of the visualization file (default \"png\")"),
+ ("view","program to open the resulting file (default \"open\")"),
+ ("nodefont","font for tree nodes (default: Times -- graphviz standard font)"),
+ ("leaffont","font for tree leaves (default: nodefont)"),
+ ("nodecolor","color for tree nodes (default: black -- graphviz standard color)"),
+ ("leafcolor","color for tree leaves (default: nodecolor)"),
+ ("nodeedgestyle","edge style between tree nodes (solid/dashed/dotted/bold, default: solid)"),
+ ("leafedgestyle","edge style for links to leaves (solid/dashed/dotted/bold, default: dashed)")
+ ]
+ }),
+
+ ("vt", emptyCommandInfo {
+ longname = "visualize_tree",
+ synopsis = "show a set of trees graphically",
+ explanation = unlines [
+ "Prints a set of trees in the .dot format (the graphviz format).",
+ "The graph can be saved in a file by the wf command as usual.",
+ "If the -view flag is defined, the graph is saved in a temporary file",
+ "which is processed by graphviz and displayed by the program indicated",
+ "by the flag. The target format is postscript, unless overridden by the",
+ "flag -format.",
+ "With option -mk, use for showing library style function names of form 'mkC'."
+ ],
+ exec = \env@(pgf, mos) opts es ->
+ if isOpt "mk" opts
+ then return $ fromString $ unlines $ map (tree2mk pgf) es
+ else if isOpt "api" opts
+ then do
+ let ss = map exprToAPI es
+ mapM_ putStrLn ss
+ return void
+ else do
+ let funs = not (isOpt "nofun" opts)
+ let cats = not (isOpt "nocat" opts)
+ let grph = unlines (map (H.graphvizAbstractTree pgf (funs,cats)) es) -- True=digraph
+ if isFlag "view" opts || isFlag "format" opts then do
+ let file s = "_grph." ++ s
+ let view = optViewGraph opts
+ let format = optViewFormat opts
+ restricted $ writeUTF8File (file "dot") grph
+ restrictedSystem $ "dot -T" ++ format ++ " " ++ file "dot" ++ " > " ++ file format
+ restrictedSystem $ view ++ " " ++ file format
+ return void
+ else return $ fromString grph,
+ examples = [
+ mkEx "p \"hello\" | vt -- parse a string and show trees as graph script",
+ mkEx "p \"hello\" | vt -view=\"open\" -- parse a string and display trees on a Mac"
+ ],
+ options = [
+ ("api", "show the tree with function names converted to 'mkC' with value cats C"),
+ ("mk", "similar to -api, deprecated"),
+ ("nofun","don't show functions but only categories"),
+ ("nocat","don't show categories but only functions")
+ ],
+ flags = [
+ ("format","format of the visualization file (default \"png\")"),
+ ("view","program to open the resulting file (default \"open\")")
+ ]
+ }),
+-}
+ ("wf", emptyCommandInfo {
+ longname = "write_file",
+ synopsis = "send string or tree to a file",
+ exec = \_ opts arg -> do
+ let file = valStrOpts "file" "_gftmp" opts
+ if isOpt "append" opts
+ then restricted $ appendFile file (toString arg)
+ else restricted $ writeUTF8File file (toString arg)
+ return void,
+ options = [
+ ("append","append to file, instead of overwriting it")
+ ],
+ flags = [("file","the output filename")]
+ }){-,
+ ("ai", emptyCommandInfo {
+ longname = "abstract_info",
+ syntax = "ai IDENTIFIER or ai EXPR",
+ synopsis = "Provides an information about a function, an expression or a category from the abstract syntax",
+ explanation = unlines [
+ "The command has one argument which is either function, expression or",
+ "a category defined in the abstract syntax of the current grammar. ",
+ "If the argument is a function then ?its type is printed out.",
+ "If it is a category then the category definition is printed.",
+ "If a whole expression is given it prints the expression with refined",
+ "metavariables and the type of the expression."
+ ],
+ exec = \env@(pgf, mos) opts arg -> do
+ case arg of
+ [H.EFun id]->case Map.lookup id (H.funs (H.abstract pgf)) of
+ Just fd -> do putStrLn $ render (H.ppFun id fd)
+ let (_,_,_,prob) = fd
+ putStrLn ("Probability: "++show prob)
+ return void
+ Nothing -> case Map.lookup id (H.cats (H.abstract pgf)) of
+ Just cd -> do putStrLn $
+ render (H.ppCat id cd $$
+ if null (H.functionsToCat pgf id)
+ then empty
+ else ' ' $$
+ vcat [H.ppFun fid (ty,0,Just ([],[]),0) | (fid,ty) <- H.functionsToCat pgf id] $$
+ ' ')
+ let (_,_,prob) = cd
+ putStrLn ("Probability: "++show prob)
+ return void
+ Nothing -> do putStrLn ("unknown category of function identifier "++show id)
+ return void
+ [e] -> case H.inferExpr pgf e of
+ Left tcErr -> error $ render (H.ppTcError tcErr)
+ Right (e,ty) -> do putStrLn ("Expression: "++H.showExpr [] e)
+ putStrLn ("Type: "++H.showType [] ty)
+ putStrLn ("Probability: "++show (H.probTree pgf e))
+ return void
+ _ -> do putStrLn "a single identifier or expression is expected from the command"
+ return void,
+ needsTypeCheck = False
+ })-}
+ ]
+ where
+{-
+ par pgf opts s = case optOpenTypes opts of
+ [] -> [H.parse_ pgf lang (optType pgf opts) (Just dp) s | lang <- optLangs pgf opts]
+ open_typs -> [H.parseWithRecovery pgf lang (optType pgf opts) open_typs (Just dp) s | lang <- optLangs pgf opts]
+ where
+ dp = valIntOpts "depth" 4 opts
+-}
+ cParse env@(pgf,_) opts ss =
+ parsed [ C.parse cnc cat s | s<-ss,(lang,cnc)<-cncs]
+ where
+ cat = optCat pgf opts
+ cncs = optConcs env opts
+ parsed rs = Piped (ts,unlines msgs)
+ where
+ ts = [hsExpr t|Right ts<-rs,(t,p)<-takeOptNum opts ts]
+ msgs = concatMap (either err ok) rs
+ err msg = ["Parse failed: "++msg]
+ ok = map (C.showExpr . fst).takeOptNum opts
+
+ cLins env opts ts = [C.linearize cnc t|t<-ts,(lang,cnc)<-cncs]
+ where
+ cncs = optConcs env opts
+
+ optConcs = optConcsFlag "lang"
+
+ optConcsFlag f (pgf,cncs) opts =
+ case valStrOpts f "" opts of
+ "" -> Map.toList cncs
+ lang -> mapMaybe pickLang (chunks ',' lang)
+ where
+ pickLang l = pick l `mplus` pick fl
+ where
+ fl = C.abstractName pgf++l
+ pick l = (,) l `fmap` Map.lookup l cncs
+
+{-
+ optLins pgf opts ts = case opts of
+ _ | isOpt "groups" opts ->
+ map (unlines . snd) $ H.groupResults
+ [[(lang, linear pgf opts lang t) | lang <- optLangs pgf opts] | t <- ts]
+ _ -> map (optLin pgf opts) ts
+ optLin pgf opts t = unlines $
+ case opts of
+ _ | isOpt "treebank" opts && isOpt "chunks" opts ->
+ (H.showCId (H.abstractName pgf) ++ ": " ++ H.showExpr [] t) :
+ [H.showCId lang ++ ": " ++ li | (lang,li) <- linChunks pgf opts t] --linear pgf opts lang t | lang <- optLangs pgf opts]
+ _ | isOpt "treebank" opts ->
+ (H.showCId (H.abstractName pgf) ++ ": " ++ H.showExpr [] t) :
+ [H.showCId lang ++ ": " ++ linear pgf opts lang t | lang <- optLangs pgf opts]
+ _ | isOpt "chunks" opts -> map snd $ linChunks pgf opts t
+ _ -> [linear pgf opts lang t | lang <- optLangs pgf opts]
+ linChunks pgf opts t =
+ [(lang, unwords (intersperse "<+>" (map (linear pgf opts lang) (treeChunks t)))) | lang <- optLangs pgf opts]
+
+ linear :: H.PGF -> [Option] -> H.CId -> H.Expr -> String
+ linear pgf opts lang = let unl = unlex opts lang in case opts of
+ _ | isOpt "all" opts -> unlines . concat . intersperse [[]] .
+ map (map (unl . snd)) . H.tabularLinearizes pgf lang
+ _ | isOpt "list" opts -> commaList . concat . intersperse [[]] .
+ map (map (unl . snd)) . H.tabularLinearizes pgf lang
+ _ | isOpt "table" opts -> unlines . concat . intersperse [[]] .
+ map (map (\(p,v) -> p+++":"+++unl v)) . H.tabularLinearizes pgf lang
+ _ | isOpt "bracket" opts -> unwords . map H.showBracketedString . H.bracketedLinearize pgf lang
+ _ -> unl . H.linearize pgf lang
+
+ -- replace each non-atomic constructor with mkC, where C is the val cat
+ tree2mk pgf = H.showExpr [] . t2m where
+ t2m t = case H.unApp t of
+ Just (cid,ts@(_:_)) -> H.mkApp (mk cid) (map t2m ts)
+ _ -> t
+ mk = H.mkCId . ("mk" ++) . H.showCId . H.lookValCat (H.abstract pgf)
+-}
+ unlex opts lang = stringOps Nothing (getUnlex opts lang ++ map prOpt opts) ----
+
+ getUnlex opts lang = case words (valStrOpts "unlexer" "" opts) of
+ lexs -> case lookup lang
+ [(H.mkCId la,tail le) | lex <- lexs, let (la,le) = span (/='=') lex, not (null le)] of
+ Just le -> chunks ',' le
+ _ -> []
+{-
+ commaList [] = []
+ commaList ws = concat $ head ws : map (", " ++) (tail ws)
+-}
+-- Proposed logic of coding in unlexing:
+-- - If lang has no coding flag, or -to_utf8 is not in opts, just opts are used.
+-- - If lang has flag coding=utf8, -to_utf8 is ignored.
+-- - If lang has coding=other, and -to_utf8 is in opts, from_other is applied first.
+-- THIS DOES NOT WORK UNFORTUNATELY - can't use the grammar flag properly
+{-
+ unlexx pgf opts lang = {- trace (unwords optsC) $ -} stringOps Nothing optsC where ----
+ optsC = case lookConcrFlag pgf (H.mkCId lang) (H.mkCId "coding") of
+ Just (LStr "utf8") -> filter (/="to_utf8") $ map prOpt opts
+ Just (LStr other) | isOpt "to_utf8" opts ->
+ let cod = ("from_" ++ other)
+ in cod : filter (/=cod) (map prOpt opts)
+ _ -> map prOpt opts
+
+ optRestricted opts pgf =
+ H.restrictPGF (\f -> and [H.hasLin pgf la f | la <- optLangs pgf opts]) pgf
+
+ optLang = optLangFlag "lang"
+ optLangs = optLangsFlag "lang"
+
+ optLangsFlag f pgf opts = case valStrOpts f "" opts of
+ "" -> H.languages pgf
+ lang -> map (completeLang pgf) (chunks ',' lang)
+
+ completeLang pgf la = let cla = (H.mkCId la) in
+ if elem cla (H.languages pgf)
+ then cla
+ else (H.mkCId (H.showCId (H.abstractName pgf) ++ la))
+
+ optLangFlag f pgf opts = head $ optLangsFlag f pgf opts ++ [H.wildCId]
+
+ optOpenTypes opts = case valStrOpts "openclass" "" opts of
+ "" -> []
+ cats -> mapMaybe H.readType (chunks ',' cats)
+
+ optProbs opts pgf = case valStrOpts "probs" "" opts of
+ "" -> return pgf
+ file -> do
+ probs <- restricted $ H.readProbabilitiesFromFile file pgf
+ return (H.setProbabilities probs pgf)
+-}
+ optTranslit opts = case (valStrOpts "to" "" opts, valStrOpts "from" "" opts) of
+ ("","") -> return id
+ (file,"") -> do
+ src <- restricted $ readFile file
+ return $ transliterateWithFile file src False
+ (_,file) -> do
+ src <- restricted $ readFile file
+ return $ transliterateWithFile file src True
+{-
+ optFile opts = valStrOpts "file" "_gftmp" opts
+-}
+ optCat pgf opts = valStrOpts "cat" (C.startCat pgf) opts
+{-
+ optType pgf opts =
+ let str = valStrOpts "cat" (H.showCId $ H.lookStartCat pgf) opts
+ in case H.readType str of
+ Just ty -> case H.checkType pgf ty of
+ Left tcErr -> error $ render (H.ppTcError tcErr)
+ Right ty -> ty
+ Nothing -> error ("Can't parse '"++str++"' as a type")
+-}
+ optComm opts = valStrOpts "command" "" opts
+{-
+ optViewFormat opts = valStrOpts "format" "png" opts
+ optViewGraph opts = valStrOpts "view" "open" opts
+ optNum opts = valIntOpts "number" 1 opts
+-}
+ optNumInf opts = valIntOpts "number" 1000000000 opts ---- 10^9
+ takeOptNum opts = take (optNumInf opts)
+{-
+ fromParse opts [] = ([],[])
+ fromParse opts ((s,(po,bs)):ps)
+ | isOpt "bracket" opts = (es, H.showBracketedString bs
+ ++ "\n" ++ msg)
+ | otherwise = case po of
+ H.ParseOk ts -> let Piped (es',msg') = fromExprs ts
+ in (es'++es,msg'++msg)
+ H.TypeError errs -> ([], render ("The parsing is successful but the type checking failed with error(s):" $$
+ nest 2 (vcat (map (H.ppTcError . snd) errs)))
+ ++ "\n" ++ msg)
+ H.ParseFailed i -> ([], "The parser failed at token " ++ show (words s !! max 0 (i-1))
+ ++ "\n" ++ msg)
+ H.ParseIncomplete-> ([], "The sentence is not complete")
+ where
+ (es,msg) = fromParse opts ps
+-}
+ returnFromCExprs = returnFromExprs . map hsExpr
+ returnFromExprs es =
+ return $ case es of
+ [] -> pipeMessage "no trees found"
+ _ -> fromExprs es
+{-
+ prGrammar env@(pgf,mos) opts
+ | isOpt "pgf" opts = do
+ let pgf1 = if isOpt "opt" opts then H.optimizePGF pgf else pgf
+ let outfile = valStrOpts "file" (H.showCId (H.abstractName pgf) ++ ".pgf") opts
+ restricted $ encodeFile outfile pgf1
+ putStrLn $ "wrote file " ++ outfile
+ return void
+ | isOpt "cats" opts = return $ fromString $ unwords $ map H.showCId $ H.categories pgf
+ | isOpt "funs" opts = return $ fromString $ unlines $ map showFun $ funsigs pgf
+ | isOpt "fullform" opts = return $ fromString $ concatMap (morpho mos "" prFullFormLexicon) $ optLangs pgf opts
+ | isOpt "langs" opts = return $ fromString $ unwords $ map H.showCId $ H.languages pgf
+
+ | isOpt "lexc" opts = return $ fromString $ concatMap (morpho mos "" prLexcLexicon) $ optLangs pgf opts
+ | isOpt "missing" opts = return $ fromString $ unlines $ [unwords (H.showCId la:":": map H.showCId cs) |
+ la <- optLangs pgf opts, let cs = H.missingLins pgf la]
+ | isOpt "words" opts = return $ fromString $ concatMap (morpho mos "" prAllWords) $ optLangs pgf opts
+ | otherwise = do fmt <- readOutputFormat (valStrOpts "printer" "pgf_pretty" opts)
+ return $ fromString $ concatMap snd $ exportPGF noOptions fmt pgf
+
+ funsigs pgf = [(f,ty) | (f,(ty,_,_,_)) <- Map.assocs (H.funs (H.abstract pgf))]
+ showFun (f,ty) = H.showCId f ++ " : " ++ H.showType [] ty ++ " ;"
+
+ morphos (pgf,mos) opts s =
+ [(s,morpho mos [] (\mo -> H.lookupMorpho mo s) la) | la <- optLangs pgf opts]
+
+ morpho mos z f la = maybe z f $ Map.lookup la mos
+
+ optMorpho (pgf,mos) opts = morpho mos (error "no morpho") id (head (optLangs pgf opts))
+
+ optClitics opts = case valStrOpts "clitics" "" opts of
+ "" -> []
+ cs -> map reverse $ chunks ',' cs
+
+ mexp xs = case xs of
+ t:_ -> Just t
+ _ -> Nothing
+-}
+ -- ps -f -g s returns g (f s)
+ stringOps menv opts s = foldr (menvop . app) s (reverse opts) where
+ app f = maybe id id (stringOp f)
+ menvop op = maybe op (\ (b,e) -> opInEnv b e op) menv
+
+ envFlag fs = case valStrOpts "env" "global" fs of
+ "quotes" -> Just ("\"","\"")
+ _ -> Nothing
+{-
+ treeOps pgf opts s = foldr app s (reverse opts) where
+ app (OOpt op) | Just (Left f) <- treeOp pgf op = f
+ app (OFlag op (VId x)) | Just (Right f) <- treeOp pgf op = f (H.mkCId x)
+ app _ = id
+-}
+stringOpOptions = sort $ [
+ ("bind","bind tokens separated by Prelude.BIND, i.e. &+"),
+ ("chars","lexer that makes every non-space character a token"),
+ ("from_cp1251","decode from cp1251 (Cyrillic used in Bulgarian resource)"),
+ ("from_utf8","decode from utf8 (default)"),
+ ("lextext","text-like lexer"),
+ ("lexcode","code-like lexer"),
+ ("lexmixed","mixture of text and code, as in LaTeX (code between $...$, \\(...)\\, \\[...\\])"),
+ ("to_cp1251","encode to cp1251 (Cyrillic used in Bulgarian resource)"),
+ ("to_html","wrap in a html file with linebreaks"),
+ ("to_utf8","encode to utf8 (default)"),
+ ("unlextext","text-like unlexer"),
+ ("unlexcode","code-like unlexer"),
+ ("unlexmixed","mixture of text and code (code between $...$, \\(...)\\, \\[...\\])"),
+ ("unchars","unlexer that puts no spaces between tokens"),
+ ("unwords","unlexer that puts a single space between tokens (default)"),
+ ("words","lexer that assumes tokens separated by spaces (default)")
+ ] ++
+ concat [
+ [("from_" ++ p, "from unicode to GF " ++ n ++ " transliteration"),
+ ("to_" ++ p, "from GF " ++ n ++ " transliteration to unicode")] |
+ (p,n) <- transliterationPrintNames]
+{-
+treeOpOptions pgf = [(op,expl) | (op,(expl,Left _)) <- allTreeOps pgf]
+treeOpFlags pgf = [(op,expl) | (op,(expl,Right _)) <- allTreeOps pgf]
+
+translationQuiz :: Maybe H.Expr -> H.PGF -> H.Language -> H.Language -> H.Type -> IO ()
+translationQuiz mex pgf ig og typ = do
+ tts <- translationList mex pgf ig og typ infinity
+ mkQuiz "Welcome to GF Translation Quiz." tts
+
+morphologyQuiz :: Maybe H.Expr -> H.PGF -> H.Language -> H.Type -> IO ()
+morphologyQuiz mex pgf ig typ = do
+ tts <- morphologyList mex pgf ig typ infinity
+ mkQuiz "Welcome to GF Morphology Quiz." tts
+
+-- | the maximal number of precompiled quiz problems
+infinity :: Int
+infinity = 256
+
+prLexcLexicon :: H.Morpho -> String
+prLexcLexicon mo =
+ unlines $ "Multichar_Symbols":multichars:"":"LEXICON Root" : [prLexc l p ++ ":" ++ w ++ " # ;" | (w,lps) <- morpho, (l,p) <- lps] ++ ["END"]
+ where
+ morpho = H.fullFormLexicon mo
+ prLexc l p = H.showCId l ++ concat (mkTags (words p))
+ mkTags p = case p of
+ "s":ws -> mkTags ws --- remove record field
+ ws -> map ('+':) ws
+
+ multichars = unwords $ nub $ concat [mkTags (words p) | (w,lps) <- morpho, (l,p) <- lps]
+ -- thick_A+(AAdj+Posit+Gen):thick's # ;
+
+prFullFormLexicon :: H.Morpho -> String
+prFullFormLexicon mo =
+ unlines (map prMorphoAnalysis (H.fullFormLexicon mo))
+
+prAllWords :: H.Morpho -> String
+prAllWords mo =
+ unwords [w | (w,_) <- H.fullFormLexicon mo]
+
+prMorphoAnalysis :: (String,[(H.Lemma,H.Analysis)]) -> String
+prMorphoAnalysis (w,lps) =
+ unlines (w:[H.showCId l ++ " : " ++ p | (l,p) <- lps])
+-}
+
+trie = render . pptss . H.toTrie . map H.toATree
+ where
+ pptss [ts] = "*"<+>nest 2 (ppts ts)
+ pptss tss = vcat [i<+>nest 2 (ppts ts)|(i,ts)<-zip [(1::Int)..] tss]
+
+ ppts = vcat . map ppt
+
+ ppt t =
+ case t of
+ H.Oth e -> pp (H.showExpr [] e)
+ H.Ap f [[]] -> pp (H.showCId f)
+ H.Ap f tss -> H.showCId f $$ nest 2 (pptss tss)
+
+hsExpr c =
+ case C.unApp c of
+ Just (f,cs) -> H.mkApp (H.mkCId f) (map hsExpr cs)
+ _ -> error "GF.Command.Commands2.hsExpr"
+
+cExpr e =
+ case H.unApp e of
+ Just (f,es) -> C.mkApp (H.showCId f) (map cExpr es)
+ _ -> error "GF.Command.Commands2.cExpr"
+
+needPGF exec (mb_pgf,cncs) opts ts =
+ case mb_pgf of
+ Just pgf -> exec (pgf,cncs) opts ts
+ _ -> fail "Import a grammar before using this command"