forked from GitHub/gf-core
The API in the C runtime as well as in the Haskell, Python and Java binding is changed. Now instead of adding the literal callbacks to the concrete syntax you need to supply them every time when you need to parse. The main reason is: - referentially transparent API for Haskell - when we start using memory mapped files we will not be allowed to change anything in the grammar data structures. At that point the old API would be impossible to use.
134 lines
3.6 KiB
C
134 lines
3.6 KiB
C
#include <gu/variant.h>
|
|
#include <gu/map.h>
|
|
#include <gu/enum.h>
|
|
#include <gu/file.h>
|
|
#include <pgf/pgf.h>
|
|
#include <pgf/data.h>
|
|
#include <pgf/literals.h>
|
|
#include <pgf/linearizer.h>
|
|
#include <pgf/expr.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <locale.h>
|
|
#include <time.h>
|
|
|
|
int main(int argc, char* argv[]) {
|
|
// Set the character locale, so we can produce proper output.
|
|
setlocale(LC_CTYPE, "");
|
|
|
|
// Create the pool that is used to allocate everything
|
|
GuPool* pool = gu_new_pool();
|
|
int status = EXIT_SUCCESS;
|
|
if (argc < 4 || argc > 5) {
|
|
fprintf(stderr, "usage: %s pgf-file start-cat cnc-lang [heuristics]\n(0.0 <= heuristics < 1.0, default: 0.95)\n", argv[0]);
|
|
status = EXIT_FAILURE;
|
|
goto fail;
|
|
}
|
|
char* filename = argv[1];
|
|
GuString cat = argv[2];
|
|
GuString lang = argv[3];
|
|
|
|
double heuristics = 0.95;
|
|
if (argc == 5) {
|
|
heuristics = atof(argv[4]);
|
|
}
|
|
|
|
// Create an exception frame that catches all errors.
|
|
GuExn* err = gu_new_exn(pool);
|
|
|
|
|
|
clock_t start = clock();
|
|
|
|
// Read the PGF grammar.
|
|
PgfPGF* pgf = pgf_read(filename, pool, err);
|
|
|
|
// If an error occured, it shows in the exception frame
|
|
if (!gu_ok(err)) {
|
|
fprintf(stderr, "Reading PGF failed\n");
|
|
status = EXIT_FAILURE;
|
|
goto fail;
|
|
}
|
|
|
|
// Look up the source and destination concrete categories
|
|
PgfConcr* concr = pgf_get_language(pgf, lang);
|
|
if (!concr) {
|
|
fprintf(stderr, "Unknown language\n");
|
|
status = EXIT_FAILURE;
|
|
goto fail;
|
|
}
|
|
|
|
clock_t end = clock();
|
|
double cpu_time_used = ((double) (end - start)) / CLOCKS_PER_SEC;
|
|
|
|
fprintf(stderr, "(%.0f ms) Ready to parse [heuristics=%.2f]!\n", 1000.0 * cpu_time_used, heuristics);
|
|
|
|
// Create an output stream for stdout
|
|
GuOut* out = gu_file_out(stdout, pool);
|
|
|
|
// We will keep the latest results in the 'ppool' and
|
|
// we will iterate over them by using 'result'.
|
|
GuPool* ppool = NULL;
|
|
|
|
// The interactive PARSING loop.
|
|
// XXX: This currently reads stdin directly, so it doesn't support
|
|
// encodings properly. TODO: use a locale reader for input
|
|
for (int ctr = 0; true; ctr++) {
|
|
// We release the last results
|
|
if (ppool != NULL) {
|
|
gu_pool_free(ppool);
|
|
ppool = NULL;
|
|
}
|
|
|
|
/* fprintf(stdout, "> "); */
|
|
/* fflush(stdout); */
|
|
char buf[4096];
|
|
char* line = fgets(buf, sizeof(buf), stdin);
|
|
if (line == NULL) {
|
|
if (ferror(stdin)) {
|
|
fprintf(stderr, "Input error\n");
|
|
status = EXIT_FAILURE;
|
|
}
|
|
break;
|
|
} else if (strcmp(line, "") == 0) {
|
|
// End nicely on empty input
|
|
break;
|
|
} else if (strcmp(line, "\n") == 0) {
|
|
// Empty line -> skip
|
|
continue;
|
|
}
|
|
|
|
// We create a temporary pool for translating a single
|
|
// sentence, so our memory usage doesn't increase over time.
|
|
ppool = gu_new_pool();
|
|
|
|
clock_t start = clock();
|
|
|
|
GuExn* parse_err = gu_new_exn(ppool);
|
|
PgfCallbacksMap* callbacks = pgf_new_callbacks_map(concr, ppool);
|
|
GuEnum* result = pgf_parse_with_heuristics(concr, cat, line, heuristics, callbacks, parse_err, ppool, ppool);
|
|
|
|
PgfExprProb* ep = NULL;
|
|
if (gu_ok(parse_err))
|
|
ep = gu_next(result, PgfExprProb*, ppool);
|
|
|
|
clock_t end = clock();
|
|
double cpu_time_used = ((double) (end - start)) / CLOCKS_PER_SEC;
|
|
|
|
gu_printf(out, err, "%d (%.0f ms): ", ctr, 1000.0 * cpu_time_used);
|
|
if (ep != NULL) {
|
|
gu_printf(out, err, "[%.4f] (", ep->prob);
|
|
pgf_print_expr(ep->expr, NULL, 0, out, err);
|
|
gu_printf(out, err, ")\n");
|
|
} else {
|
|
gu_printf(out, err, "---\n");
|
|
}
|
|
gu_out_flush(out, err);
|
|
}
|
|
|
|
fail:
|
|
gu_pool_free(pool);
|
|
return status;
|
|
}
|
|
|