1 // pdtcompose.cc
2
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 // http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 //
15 // Copyright 2005-2010 Google, Inc.
16 // Author: riley@google.com (Michael Riley)
17 //
18 // \file
19 // Composes a PDT and an FST.
20 //
21
22 #include <vector>
23 using std::vector;
24 #include <utility>
25 using std::pair; using std::make_pair;
26
27 #include <fst/util.h>
28 #include <fst/extensions/pdt/pdtscript.h>
29 #include <fst/script/connect.h>
30
31 DEFINE_string(pdt_parentheses, "", "PDT parenthesis label pairs.");
32 DEFINE_bool(left_pdt, true, "1st arg is PDT (o.w. 2nd arg).");
33 DEFINE_bool(connect, true, "Trim output");
34 DEFINE_string(compose_filter, "paren",
35 "Composition filter, one of: \"expand\", \"expand_paren\", "
36 "\"paren\"");
37
main(int argc,char ** argv)38 int main(int argc, char **argv) {
39 namespace s = fst::script;
40
41 string usage = "Compose a PDT and an FST.\n\n Usage: ";
42 usage += argv[0];
43 usage += " in.pdt in.fst [out.pdt]\n";
44 usage += " in.fst in.pdt [out.pdt]\n";
45
46 std::set_new_handler(FailedNewHandler);
47 SET_FLAGS(usage.c_str(), &argc, &argv, true);
48 if (argc < 3 || argc > 4) {
49 ShowUsage();
50 return 1;
51 }
52
53 string in1_name = strcmp(argv[1], "-") == 0 ? "" : argv[1];
54 string in2_name = strcmp(argv[2], "-") == 0 ? "" : argv[2];
55 string out_name = argc > 3 ? argv[3] : "";
56
57 if (in1_name.empty() && in2_name.empty()) {
58 LOG(ERROR) << argv[0] << ": Can't take both inputs from standard input.";
59 return 1;
60 }
61
62 s::FstClass *ifst1 = s::FstClass::Read(in1_name);
63 if (!ifst1) return 1;
64 s::FstClass *ifst2 = s::FstClass::Read(in2_name);
65 if (!ifst2) return 1;
66
67 if (FLAGS_pdt_parentheses.empty()) {
68 LOG(ERROR) << argv[0] << ": No PDT parenthesis label pairs provided";
69 return 1;
70 }
71
72 vector<pair<int64, int64> > parens;
73 fst::ReadLabelPairs(FLAGS_pdt_parentheses, &parens, false);
74
75 s::VectorFstClass ofst(ifst1->ArcType());
76
77 fst::PdtComposeFilter compose_filter;
78
79 if (FLAGS_compose_filter == "expand") {
80 compose_filter = fst::EXPAND_FILTER;
81 } else if (FLAGS_compose_filter == "expand_paren") {
82 compose_filter = fst::EXPAND_PAREN_FILTER;
83 } else if (FLAGS_compose_filter == "paren") {
84 compose_filter = fst::PAREN_FILTER;
85 } else {
86 LOG(ERROR) << argv[0] << "Unknown compose filter type: "
87 << FLAGS_compose_filter;
88 return 1;
89 }
90
91 fst::PdtComposeOptions copts(false, compose_filter);
92
93 s::PdtCompose(*ifst1, *ifst2, parens, &ofst, copts, FLAGS_left_pdt);
94
95 if (FLAGS_connect)
96 s::Connect(&ofst);
97 ofst.Write(out_name);
98
99 return 0;
100 }
101