// farprintstrings.cc
// See www.openfst.org for extensive documentation on this weighted
// finite-state transducer library.
//
// Outputs as strings the string FSTs in a finite-state archive.
#include <string>
#include <vector>
#include <fst/flags.h>
#include <fst/extensions/far/farscript.h>
#include <fst/extensions/far/getters.h>
// Command-line flags. main() reads the resulting FLAGS_<name> values and
// forwards them to fst::script::FarPrintStrings.

// Options controlling the filenames used for entries: a prefix and suffix
// applied to each filename, and an optional fixed-width numeric naming scheme
// (0, the default, means the entry keys are used instead).
DEFINE_string(filename_prefix, "", "Prefix to append to filenames");
DEFINE_string(filename_suffix, "", "Suffix to append to filenames");
DEFINE_int32(generate_filenames, 0,
"Generate N digit numeric filenames (def: use keys)");
// Key range to process; an empty string selects the archive's first (or last)
// key, per the help text.
DEFINE_string(begin_key, "",
"First key to extract (def: first key in archive)");
DEFINE_string(end_key, "", "Last key to extract (def: last key in archive)");
// Flags specific to printing strings (PrintStringsMain).
// Optional decorations around each printed string.
DEFINE_bool(print_key, false, "Prefix each string by its key");
DEFINE_bool(print_weight, false, "Suffix each string by its weight");
// Converted to a fst::FarEntryType by GetFarEntryType in main(); a value that
// cannot be converted makes main() log an error and return 1.
DEFINE_string(entry_type, "line",
"Entry type: one of : "
"\"file\" (one FST per file), \"line\" (one FST per line)");
// Converted to a fst::FarTokenType by GetFarTokenType in main(); a value that
// cannot be converted makes main() log an error and return 1.
DEFINE_string(token_type, "symbol",
"Token type: one of : "
"\"symbol\", \"byte\", \"utf8\"");
// Symbol table options. NOTE(review): --symbols is presumably a path to a
// symbol table file, relevant when --token_type is "symbol" -- confirm against
// FarPrintStrings.
DEFINE_string(symbols, "", "Label symbol table");
DEFINE_bool(initial_symbols, true,
"Uses symbol table from the first Fst in archive for all entries.");
// Entry point: prints, as strings, the string FSTs stored in one or more
// finite-state archives (FARs).
//
// After flag parsing and argument expansion, every argument following the
// program name is treated as an input FAR filename. When none is given, a
// single empty filename is used instead (NOTE(review): presumably interpreted
// as standard input by the FAR reader -- confirm).
//
// Returns 0 once FarPrintStrings has been invoked. Returns 1 when
// LoadArcTypeFromFar yields an empty arc type for the first input, or when
// --entry_type / --token_type cannot be converted to their enum values.
int main(int argc, char **argv) {
  namespace s = fst::script;

  // "Usage: " ends with a space so the program name appended below does not
  // run straight into the label in the help output.
  std::string usage =
      "Print as string the string FSTs in an archive.\n\n Usage: ";
  usage += argv[0];
  usage += " [in1.far in2.far ...]\n";

  std::set_new_handler(FailedNewHandler);
  SET_FLAGS(usage.c_str(), &argc, &argv, true);
  s::ExpandArgs(argc, argv, &argc, &argv);

  // Collect the input archive names; fall back to one empty name so that
  // in_fnames[0] below is always valid.
  std::vector<std::string> in_fnames;
  for (int i = 1; i < argc; ++i) in_fnames.push_back(argv[i]);
  if (in_fnames.empty()) in_fnames.push_back("");

  // The arc type is taken from the first archive only and is then used for the
  // whole run.
  const auto arc_type = s::LoadArcTypeFromFar(in_fnames[0]);
  if (arc_type.empty()) return 1;

  // Translate the textual flag values into enums, rejecting unknown names.
  fst::FarEntryType entry_type;
  if (!s::GetFarEntryType(FLAGS_entry_type, &entry_type)) {
    LOG(ERROR) << "Unknown or unsupported FAR entry type: " << FLAGS_entry_type;
    return 1;
  }

  fst::FarTokenType token_type;
  if (!s::GetFarTokenType(FLAGS_token_type, &token_type)) {
    LOG(ERROR) << "Unknown or unsupported FAR token type: " << FLAGS_token_type;
    return 1;
  }

  s::FarPrintStrings(in_fnames, arc_type, entry_type, token_type,
                     FLAGS_begin_key, FLAGS_end_key, FLAGS_print_key,
                     FLAGS_print_weight, FLAGS_symbols, FLAGS_initial_symbols,
                     FLAGS_generate_filenames, FLAGS_filename_prefix,
                     FLAGS_filename_suffix);

  return 0;
}