Beispiel #1
0
  static int run_main(int ac, char* av[]) {
    namespace po = boost::program_options;
    try {
      po::options_description generic("Allowed options");

      add(generic)("config-file,c", po::value<std::string>(), "config file name");
      add(generic)("help,h", "produce help message");

      po::options_description hidden("Hidden options");
      hidden.add_options()("input-file", po::value<std::string>(), "input file");

      po::options_description cmdline_options;
      cmdline_options.add(generic).add(hidden);

      po::options_description config_file_options;
      config_file_options.add(generic).add(hidden);

      po::positional_options_description p;
      p.add("input-file", -1);

      po::variables_map vm;
      store(po::command_line_parser(ac, av).options(cmdline_options).positional(p).run(), vm);

      if (vm.count("config-file")) {
        Util::Input ifs(vm["config-file"].as<std::string>());
        store(parse_config_file(*ifs, config_file_options), vm);
        notify(vm);
      }

      if (vm.count("help")) {
        std::cout << generic << "\n\n";
        std::cout << "Convert FSM (in hypergraph format) to OpenFst text format" << '\n';
        return EXIT_FAILURE;
      }

      std::string file;
      if (vm.count("input-file")) {
        file = vm["input-file"].as<std::string>();
      }

      typedef ViterbiWeightTpl<float> Weight;
      typedef Hypergraph::ArcTpl<Weight> Arc;

      IVocabularyPtr pVoc = Vocabulary::createDefaultVocab();

      Util::Input in_(file);

      MutableHypergraph<Arc> hg;
      hg.setVocabulary(pVoc);
      parseText(*in_, file, &hg);

      writeOpenFstFormat(std::cout, hg);

      assert(hg.checkValid());
    } catch (std::exception& e) {
      std::cerr << e.what() << '\n';
      return EXIT_FAILURE;
    }
    return EXIT_SUCCESS;
  }
Beispiel #2
0
int main(int ac, char** av) {
  try {
    sdl::Util::DefaultLocaleFastCout initCout;
    po::options_description generic("Allowed options");
    sdl::AddOption opt(generic);
    opt("config-file", po::value<std::string>(), "config file name");
    opt("symbols", po::value<std::string>(), "FST symbol table to read and use (optional)");
    opt("stem", po::value<std::string>(), "stem for output files");
    opt("help", "produce help message");

    po::options_description hidden("Hidden options");
    hidden.add_options()("input-file", po::value<std::string>(), "input file");

    po::options_description cmdline_options;
    cmdline_options.add(generic).add(hidden);

    po::options_description config_file_options;
    config_file_options.add(generic).add(hidden);

    po::positional_options_description p;
    p.add("input-file", -1);

    po::variables_map vm;
    store(po::command_line_parser(ac, av).options(cmdline_options).positional(p).run(), vm);

    using namespace sdl;
    if (vm.count("config-file")) {
      Util::Input ifs(vm["config-file"].as<std::string>());
      store(parse_config_file(*ifs, config_file_options), vm);
      notify(vm);
    }

    if (vm.count("help")) {
      std::cout << "Convert hypergraph to an OpenFst ReplaceFst object" << '\n';
      std::cout << generic << "\n";
      return EXIT_FAILURE;
    }

#if HAVE_OPENFST
    bool userProvidedSymbolTable = false;
    fst::SymbolTable* syms;
    if (vm.count("symbols")) {
      if (vm.count("stem")) { throw std::runtime_error("Do not provide both --stem and --symbols."); }
      std::string filename = vm["symbols"].as<std::string>();
      syms = fst::SymbolTable::ReadText(filename);
      userProvidedSymbolTable = true;
    } else { syms = new fst::SymbolTable(""); }

    std::string stem;
    if (vm.count("stem")) {
      if (vm.count("symbols")) { throw std::runtime_error("Do not provide both --stem and --symbols."); }
      stem = vm["stem"].as<std::string>();
    } else { stem = "replace"; }

    std::string file;
    if (vm.count("input-file")) { file = vm["input-file"].as<std::string>(); }

    // TODO: set level etc. on cmdline
    sdl::Util::initLogger("HypToReplaceFst", sdl::Util::logLevel(sdl::Util::kLogDebug));

    using namespace sdl;
    using namespace Hypergraph;

    typedef ViterbiWeightTpl<float> Weight;
    typedef ArcTpl<Weight> Arc;

    IVocabularyPtr pVoc = Vocabulary::createDefaultVocab();

    Util::Input in(file);

    MutableHypergraph<Arc> hg;
    hg.setVocabulary(pVoc);
    parseText(*in, file, &hg);
    assert(hg.checkValid());

    // Could also use LogArc and ".log-fst"
    typedef fst::StdArc FArc;
    const std::string fstName = stem + ".std-fst";

    // Convert to OpenFst ReplaceFst:
    // std::pair<const fst::Fst<FArc>*, fst::SymbolTable*> fsPair =
    // sdl::Hypergraph::toReplaceFst<FArc>(hg);
    fst::Fst<FArc>* result = sdl::Hypergraph::toReplaceFst<FArc>(hg, syms);

    // Copy to non-lazy OpenFst object and write to disk
    fst::MutableFst<FArc>* tmp = new fst::VectorFst<FArc>();
    std::cerr << "Expanding Hypergraph (will not terminate if cyclic) ... ";
    *tmp = *result;  // copy
    std::cerr << "Done.\n";

    std::cerr << "Optimizing ... ";
    fst::Project(tmp, fst::PROJECT_OUTPUT);
    fst::RmEpsilon(tmp);
    fst::MutableFst<FArc>* tmp2 = new fst::VectorFst<FArc>();
    *tmp2 = fst::DeterminizeFst<FArc>(*tmp);
    delete tmp;
    tmp = tmp2;
    fst::Minimize(tmp);
    std::cerr << "Done.\n";

    fst::FstWriteOptions opts;

    if (userProvidedSymbolTable) { tmp->Write(std::cout, opts); } else {
      std::cerr << "Writing " << fstName << '\n';
      Util::Output out(fstName);
      tmp->Write(*out, opts);

      const std::string symsName = stem + ".syms";
      std::cerr << "Writing " << symsName << '\n';
      syms->WriteText(symsName);
    }

    delete tmp;
    delete result;
    delete syms;
#else
    std::cerr << "ERROR: Recompile with OpenFst!\n";
    return EXIT_FAILURE;
#endif
  } catch (std::exception& e) {
    std::cerr << e.what() << '\n';
    return EXIT_FAILURE;
  }
  return EXIT_SUCCESS;
}