#include #include #include #include #include #include #include #include #include #include #include #include #include #include int main(int argc, char* argv[]) { // Set the character locale, so we can produce proper output. setlocale(LC_CTYPE, ""); // Create the pool that is used to allocate everything GuPool* pool = gu_new_pool(); int status = EXIT_SUCCESS; if (argc < 4 || argc > 5) { fprintf(stderr, "usage: %s pgf-file start-cat cnc-lang [heuristics]\n(0.0 <= heuristics < 1.0, default: 0.95)\n", argv[0]); status = EXIT_FAILURE; goto fail; } char* filename = argv[1]; GuString cat = argv[2]; GuString lang = argv[3]; double heuristics = 0.95; if (argc == 5) { heuristics = atof(argv[4]); } // Create an exception frame that catches all errors. GuExn* err = gu_new_exn(pool); clock_t start = clock(); // Read the PGF grammar. PgfPGF* pgf = pgf_read(filename, pool, err); // If an error occured, it shows in the exception frame if (!gu_ok(err)) { fprintf(stderr, "Reading PGF failed\n"); status = EXIT_FAILURE; goto fail; } // Look up the source and destination concrete categories PgfConcr* concr = pgf_get_language(pgf, lang); if (!concr) { fprintf(stderr, "Unknown language\n"); status = EXIT_FAILURE; goto fail; } clock_t end = clock(); double cpu_time_used = ((double) (end - start)) / CLOCKS_PER_SEC; fprintf(stderr, "(%.0f ms) Ready to parse [heuristics=%.2f]!\n", 1000.0 * cpu_time_used, heuristics); // Create an output stream for stdout GuOut* out = gu_file_out(stdout, pool); // We will keep the latest results in the 'ppool' and // we will iterate over them by using 'result'. GuPool* ppool = NULL; // The interactive PARSING loop. // XXX: This currently reads stdin directly, so it doesn't support // encodings properly. TODO: use a locale reader for input for (int ctr = 0; true; ctr++) { // We release the last results if (ppool != NULL) { gu_pool_free(ppool); ppool = NULL; } /* fprintf(stdout, "> "); */ /* fflush(stdout); */ char buf[4096]; char* line = fgets(buf, sizeof(buf), stdin); if (line == NULL) { if (ferror(stdin)) { fprintf(stderr, "Input error\n"); status = EXIT_FAILURE; } break; } else if (strcmp(line, "") == 0) { // End nicely on empty input break; } else if (strcmp(line, "\n") == 0) { // Empty line -> skip continue; } // We create a temporary pool for translating a single // sentence, so our memory usage doesn't increase over time. ppool = gu_new_pool(); clock_t start = clock(); GuExn* parse_err = gu_new_exn(ppool); PgfCallbacksMap* callbacks = pgf_new_callbacks_map(concr, ppool); GuEnum* result = pgf_parse_with_heuristics(concr, cat, line, heuristics, callbacks, parse_err, ppool, ppool); PgfExprProb* ep = NULL; if (gu_ok(parse_err)) ep = gu_next(result, PgfExprProb*, ppool); clock_t end = clock(); double cpu_time_used = ((double) (end - start)) / CLOCKS_PER_SEC; gu_printf(out, err, "%d (%.0f ms): ", ctr, 1000.0 * cpu_time_used); if (ep != NULL) { gu_printf(out, err, "[%.4f] (", ep->prob); pgf_print_expr(ep->expr, NULL, 0, out, err); gu_printf(out, err, ")\n"); } else { gu_printf(out, err, "---\n"); } gu_out_flush(out, err); } fail: gu_pool_free(pool); return status; }