summaryrefslogtreecommitdiff
path: root/src/runtime/c
diff options
context:
space:
mode:
authorgregoire.detrez <gregoire.detrez@gu.se>2013-01-24 13:31:34 +0000
committergregoire.detrez <gregoire.detrez@gu.se>2013-01-24 13:31:34 +0000
commit0aae4702edbd4889159e3772b72d0a4c10b7e57a (patch)
tree4b04b948fffe0ef768c204a25b1628a7640b0b27 /src/runtime/c
parente7db50b9bdd710690c78038d095bf249a9ed7f02 (diff)
Python binding: add a parsing function that directly accepts a list of tokens.
It allows defining a tokenizer in Python (or using an existing one, from NLTK for instance).
Diffstat (limited to 'src/runtime/c')
-rw-r--r--src/runtime/c/pgf/pgf.c27
-rw-r--r--src/runtime/c/pgf/pgf.h3
2 files changed, 30 insertions, 0 deletions
diff --git a/src/runtime/c/pgf/pgf.c b/src/runtime/c/pgf/pgf.c
index ccee4bf24..2b720f093 100644
--- a/src/runtime/c/pgf/pgf.c
+++ b/src/runtime/c/pgf/pgf.c
@@ -227,6 +227,33 @@ pgf_parse(PgfConcr* concr, PgfCId cat, PgfLexer *lexer, GuPool* pool)
return pgf_parse_result(state, pool);
}
+// Same as pgf_parse, but takes an array of `len` token strings instead of a
+// lexer. Returns NULL as soon as any parser state comes back NULL.
+GuEnum*
+pgf_parse_tokens(PgfConcr* concr, PgfCId cat, char **tokens, int len, GuPool* pool)
+{
+ // Create the initial parser state for category `cat`; give up if there is none
+ PgfParseState* state =
+ pgf_parser_init_state(concr, cat, 0, pool);
+ if (state == NULL) {
+ return NULL;
+ }
+
+ // Feed tokens[0..len-1] to the parser in order, one state transition per token
+ PgfToken tok;
+ for (int i = 0; i < len; i++) {
+ tok = gu_str_string(tokens[i], pool);
+
+ state = pgf_parser_next_state(state, tok, pool);
+ if (state == NULL) {
+ return NULL;
+ }
+ }
+
+ // Every token was consumed: enumerate the resulting syntax trees
+ return pgf_parse_result(state, pool);
+}
+
void
pgf_print_chunks(PgfConcr* concr, PgfCId cat, PgfLexer *lexer, GuPool* pool)
{
diff --git a/src/runtime/c/pgf/pgf.h b/src/runtime/c/pgf/pgf.h
index 1f3947bff..afef6ec48 100644
--- a/src/runtime/c/pgf/pgf.h
+++ b/src/runtime/c/pgf/pgf.h
@@ -116,6 +116,9 @@ PgfExprEnum*
pgf_parse(PgfConcr* concr, PgfCId cat, PgfLexer *lexer, GuPool* pool);
PgfExprEnum*
+pgf_parse_tokens(PgfConcr* concr, PgfCId cat, char* tokens[], int len, GuPool* pool);
+
+PgfExprEnum*
pgf_generate(PgfPGF* pgf, PgfCId cat, GuPool* pool);
// an experimental function. Please don't use it