blob: f46116f9f44cc150619f99aa0fb330281debd501 [file] [log] [blame]
// intersect.h
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// Copyright 2005-2010 Google, Inc.
// Author: riley@google.com (Michael Riley)
//
// \file
// Class to compute the intersection of two FSAs
#ifndef FST_LIB_INTERSECT_H__
#define FST_LIB_INTERSECT_H__
#include <algorithm>
#include <vector>
using std::vector;
#include <fst/cache.h>
#include <fst/compose.h>
namespace fst {
template <class A,
class M = Matcher<Fst<A> >,
class F = SequenceComposeFilter<M>,
class T = GenericComposeStateTable<A, typename F::FilterState> >
struct IntersectFstOptions : public ComposeFstOptions<A, M, F, T> {
explicit IntersectFstOptions(const CacheOptions &opts,
M *mat1 = 0, M *mat2 = 0,
F *filt = 0, T *sttable= 0)
: ComposeFstOptions<A, M, F, T>(opts, mat1, mat2, filt, sttable) { }
IntersectFstOptions() {}
};
// Computes the intersection (Hadamard product) of two FSAs. This
// version is a delayed Fst. Only strings that are in both automata
// are retained in the result.
//
// The two arguments must be acceptors. One of the arguments must be
// label-sorted.
//
// Complexity: same as ComposeFst.
//
// Caveats: same as ComposeFst.
template <class A>
class IntersectFst : public ComposeFst<A> {
public:
using ComposeFst<A>::CreateBase;
using ComposeFst<A>::CreateBase1;
using ComposeFst<A>::Properties;
using ImplToFst< ComposeFstImplBase<A> >::GetImpl;
using ImplToFst< ComposeFstImplBase<A> >::SetImpl;
typedef A Arc;
typedef typename A::Weight Weight;
typedef typename A::StateId StateId;
IntersectFst(const Fst<A> &fst1, const Fst<A> &fst2,
const CacheOptions opts = CacheOptions()) {
bool acceptors = fst1.Properties(kAcceptor, true) &&
fst2.Properties(kAcceptor, true);
SetImpl(CreateBase(fst1, fst2, opts));
if (!acceptors) {
FSTERROR() << "IntersectFst: input FSTs are not acceptors";
GetImpl()->SetProperties(kError);
}
}
template <class M, class F, class T>
IntersectFst(const Fst<A> &fst1, const Fst<A> &fst2,
const IntersectFstOptions<A, M, F, T> &opts) {
bool acceptors = fst1.Properties(kAcceptor, true) &&
fst2.Properties(kAcceptor, true);
SetImpl(CreateBase1(fst1, fst2, opts));
if (!acceptors) {
FSTERROR() << "IntersectFst: input FSTs are not acceptors";
GetImpl()->SetProperties(kError);
}
}
// See Fst<>::Copy() for doc.
IntersectFst(const IntersectFst<A> &fst, bool safe = false) :
ComposeFst<A>(fst, safe) {}
// Get a copy of this IntersectFst. See Fst<>::Copy() for further doc.
virtual IntersectFst<A> *Copy(bool safe = false) const {
return new IntersectFst<A>(*this, safe);
}
};
// Specialization for IntersectFst.
template <class A>
class StateIterator< IntersectFst<A> >
: public StateIterator< ComposeFst<A> > {
public:
explicit StateIterator(const IntersectFst<A> &fst)
: StateIterator< ComposeFst<A> >(fst) {}
};
// Specialization for IntersectFst.
template <class A>
class ArcIterator< IntersectFst<A> >
: public ArcIterator< ComposeFst<A> > {
public:
typedef typename A::StateId StateId;
ArcIterator(const IntersectFst<A> &fst, StateId s)
: ArcIterator< ComposeFst<A> >(fst, s) {}
};
// Useful alias when using StdArc.
typedef IntersectFst<StdArc> StdIntersectFst;
typedef ComposeOptions IntersectOptions;
// Computes the intersection (Hadamard product) of two FSAs. This
// version writes the intersection to an output MurableFst. Only
// strings that are in both automata are retained in the result.
//
// The two arguments must be acceptors. One of the arguments must be
// label-sorted.
//
// Complexity: same as Compose.
//
// Caveats: same as Compose.
template<class Arc>
void Intersect(const Fst<Arc> &ifst1, const Fst<Arc> &ifst2,
MutableFst<Arc> *ofst,
const IntersectOptions &opts = IntersectOptions()) {
typedef Matcher< Fst<Arc> > M;
if (opts.filter_type == AUTO_FILTER) {
CacheOptions nopts;
nopts.gc_limit = 0; // Cache only the last state for fastest copy.
*ofst = IntersectFst<Arc>(ifst1, ifst2, nopts);
} else if (opts.filter_type == SEQUENCE_FILTER) {
IntersectFstOptions<Arc> iopts;
iopts.gc_limit = 0; // Cache only the last state for fastest copy.
*ofst = IntersectFst<Arc>(ifst1, ifst2, iopts);
} else if (opts.filter_type == ALT_SEQUENCE_FILTER) {
IntersectFstOptions<Arc, M, AltSequenceComposeFilter<M> > iopts;
iopts.gc_limit = 0; // Cache only the last state for fastest copy.
*ofst = IntersectFst<Arc>(ifst1, ifst2, iopts);
} else if (opts.filter_type == MATCH_FILTER) {
IntersectFstOptions<Arc, M, MatchComposeFilter<M> > iopts;
iopts.gc_limit = 0; // Cache only the last state for fastest copy.
*ofst = IntersectFst<Arc>(ifst1, ifst2, iopts);
}
if (opts.connect)
Connect(ofst);
}
} // namespace fst
#endif // FST_LIB_INTERSECT_H__