// blob: 18d849d224b0e9cd48dbf419e90e92947da045e8 [file] [log] [blame]
// pdtexpand.cc
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// Copyright 2005-2010 Google, Inc.
// Author: riley@google.com (Michael Riley)
// Modified: jpr@google.com (Jake Ratkiewicz) to use FstClass
//
// \file
// Expands a (bounded-stack) PDT as an FST.
//
#include <fst/extensions/pdt/pdtscript.h>
#include <fst/util.h>
// Command-line flags consumed by main() below.

// Name of the parenthesis label-pair file handed to fst::ReadLabelPairs.
// Required: main() reports an error and exits if it is empty.
DEFINE_string(pdt_parentheses, "", "PDT parenthesis label pairs.");
// Forwarded as the first argument of PdtExpandOptions.
DEFINE_bool(connect, true, "Trim output");
// Forwarded as the second argument of PdtExpandOptions.
DEFINE_bool(keep_parentheses, false, "Keep PDT parentheses in result.");
// Textual weight threshold, parsed using the input's weight type. When empty,
// main() substitutes WeightClass::Zero().
DEFINE_string(weight, "", "Weight threshold");
int main(int argc, char **argv) {
namespace s = fst::script;
string usage = "Expand a (bounded-stack) PDT as an FST.\n\n Usage: ";
usage += argv[0];
usage += " in.pdt [out.fst]\n";
std::set_new_handler(FailedNewHandler);
SET_FLAGS(usage.c_str(), &argc, &argv, true);
if (argc > 3) {
ShowUsage();
return 1;
}
string in_name = (argc > 1 && (strcmp(argv[1], "-") != 0)) ? argv[1] : "";
string out_name = argc > 2 ? argv[2] : "";
s::FstClass *ifst = s::FstClass::Read(in_name);
if (!ifst) return 1;
if (FLAGS_pdt_parentheses.empty()) {
LOG(ERROR) << argv[0] << ": No PDT parenthesis label pairs provided";
return 1;
}
vector<pair<int64, int64> > parens;
fst::ReadLabelPairs(FLAGS_pdt_parentheses, &parens, false);
s::WeightClass weight_threshold = FLAGS_weight.empty() ?
s::WeightClass::Zero() :
s::WeightClass(ifst->WeightType(), FLAGS_weight);
s::VectorFstClass ofst(ifst->ArcType());
s::PdtExpand(*ifst, parens, &ofst, s::PdtExpandOptions(
FLAGS_connect, FLAGS_keep_parentheses, weight_threshold));
ofst.Write(out_name);
return 0;
}