forked from GitHub/gf-core
113 lines
3.0 KiB
C
113 lines
3.0 KiB
C
// Don't give too much hope to this script. It is doing the wrong thing
|
|
// but let's see how far we can get with it.
|
|
|
|
#include <gu/variant.h>
|
|
#include <gu/map.h>
|
|
#include <gu/dump.h>
|
|
#include <gu/log.h>
|
|
#include <gu/enum.h>
|
|
#include <gu/file.h>
|
|
#include <pgf/pgf.h>
|
|
#include <pgf/parser.h>
|
|
#include <pgf/lexer.h>
|
|
#include <pgf/literals.h>
|
|
#include <pgf/linearizer.h>
|
|
#include <pgf/expr.h>
|
|
#include <pgf/edsl.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <locale.h>
|
|
#include <time.h>
|
|
|
|
int main(int argc, char* argv[]) {
|
|
// Set the character locale, so we can produce proper output.
|
|
setlocale(LC_CTYPE, "");
|
|
|
|
// Create the pool that is used to allocate everything
|
|
GuPool* pool = gu_new_pool();
|
|
int status = EXIT_SUCCESS;
|
|
if (argc != 4) {
|
|
fprintf(stderr, "usage: %s pgf cat from_lang\n", argv[0]);
|
|
status = EXIT_FAILURE;
|
|
goto fail;
|
|
}
|
|
char* filename = argv[1];
|
|
|
|
GuString cat = gu_str_string(argv[2], pool);
|
|
|
|
GuString from_lang = gu_str_string(argv[3], pool);
|
|
|
|
// Create an exception frame that catches all errors.
|
|
GuExn* err = gu_new_exn(NULL, gu_kind(type), pool);
|
|
|
|
// Read the PGF grammar.
|
|
PgfPGF* pgf = pgf_read(filename, pool, err);
|
|
|
|
// If an error occured, it shows in the exception frame
|
|
if (!gu_ok(err)) {
|
|
fprintf(stderr, "Reading PGF failed\n");
|
|
status = EXIT_FAILURE;
|
|
goto fail;
|
|
}
|
|
|
|
pgf_load_meta_child_probs(pgf, "../../../treebanks/PennTreebank/ParseEngAbs3.probs", pool, err);
|
|
if (!gu_ok(err)) {
|
|
fprintf(stderr, "Loading meta child probs failed\n");
|
|
status = EXIT_FAILURE;
|
|
goto fail;
|
|
}
|
|
|
|
// Look up the source and destination concrete categories
|
|
PgfConcr* from_concr = pgf_get_language(pgf, from_lang);
|
|
if (!from_concr) {
|
|
fprintf(stderr, "Unknown language\n");
|
|
status = EXIT_FAILURE;
|
|
goto fail_concr;
|
|
}
|
|
|
|
// Register a callback for the literal category Symbol
|
|
pgf_parser_add_literal(from_concr, gu_str_string("Symb", pool),
|
|
&pgf_nerc_literal_callback);
|
|
|
|
// We will keep the latest results in the 'ppool' and
|
|
// we will iterate over them by using 'result'.
|
|
GuPool* ppool = NULL;
|
|
|
|
// The interactive translation loop.
|
|
// XXX: This currently reads stdin directly, so it doesn't support
|
|
// encodings properly. TODO: use a locale reader for input
|
|
while (true) {
|
|
char buf[4096];
|
|
char* line = fgets(buf, sizeof(buf), stdin);
|
|
if (line == NULL) {
|
|
if (ferror(stdin)) {
|
|
fprintf(stderr, "Input error\n");
|
|
status = EXIT_FAILURE;
|
|
}
|
|
break;
|
|
} else if (strcmp(line, "") == 0) {
|
|
// End nicely on empty input
|
|
break;
|
|
}
|
|
|
|
// We create a temporary pool for translating a single
|
|
// sentence, so our memory usage doesn't increase over time.
|
|
ppool = gu_new_pool();
|
|
|
|
GuReader *rdr =
|
|
gu_string_reader(gu_str_string(line, ppool), ppool);
|
|
PgfLexer *lexer =
|
|
pgf_new_simple_lexer(rdr, ppool);
|
|
|
|
pgf_print_chunks(from_concr, cat, lexer, ppool);
|
|
|
|
// Free all resources allocated during parsing and linearization
|
|
gu_pool_free(ppool);
|
|
}
|
|
fail_concr:
|
|
fail:
|
|
gu_pool_free(pool);
|
|
return status;
|
|
}
|