|
|
// Copyright 2005-2024 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the 'License');
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an 'AS IS' BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// See www.openfst.org for extensive documentation on this weighted
// finite-state transducer library.
//
// Class to complement an FST.
#ifndef FST_COMPLEMENT_H_
#define FST_COMPLEMENT_H_
#include <algorithm>
#include <cstddef>
#include <cstdint>
#include <memory>
#include <string>
#include <vector>
#include <fst/log.h>
#include <fst/arc.h>
#include <fst/float-weight.h>
#include <fst/fst.h>
#include <fst/impl-to-fst.h>
#include <fst/properties.h>
#include <fst/util.h>
namespace fst {
template <class Arc> class ComplementFst;
namespace internal {
// Implementation of delayed ComplementFst. The algorithm used completes the
// (deterministic) FSA and then exchanges final and non-final states.
// Completion, i.e. ensuring that all labels can be read from every state, is
// accomplished by using ρ-labels, which match all labels that are otherwise
// not found leaving a state. The first state in the output is reserved to be a
// new state that is the destination of all ρ-labels. Each remaining output
// state s corresponds to input state s - 1. The first arc in the output at
// these states is the ρ-label, the remaining arcs correspond to the input
// arcs.
template <class A> class ComplementFstImpl : public FstImpl<A> { public: using Arc = A; using Label = typename Arc::Label; using StateId = typename Arc::StateId; using Weight = typename Arc::Weight;
using FstImpl<A>::SetType; using FstImpl<A>::SetProperties; using FstImpl<A>::SetInputSymbols; using FstImpl<A>::SetOutputSymbols;
friend class StateIterator<ComplementFst<Arc>>; friend class ArcIterator<ComplementFst<Arc>>;
explicit ComplementFstImpl(const Fst<Arc> &fst) : fst_(fst.Copy()) { SetType("complement"); const auto props = fst.Properties(kILabelSorted, false); SetProperties(ComplementProperties(props), kCopyProperties); SetInputSymbols(fst.InputSymbols()); SetOutputSymbols(fst.OutputSymbols()); }
ComplementFstImpl(const ComplementFstImpl<Arc> &impl) : fst_(impl.fst_->Copy()) { SetType("complement"); SetProperties(impl.Properties(), kCopyProperties); SetInputSymbols(impl.InputSymbols()); SetOutputSymbols(impl.OutputSymbols()); }
StateId Start() const { if (Properties(kError)) return kNoStateId; const auto start = fst_->Start(); return start != kNoStateId ? start + 1 : 0; }
// Exchange final and non-final states; makes ρ-destination state final.
Weight Final(StateId s) const { if (s == 0 || fst_->Final(s - 1) == Weight::Zero()) { return Weight::One(); } else { return Weight::Zero(); } }
size_t NumArcs(StateId s) const { return s == 0 ? 1 : fst_->NumArcs(s - 1) + 1; }
size_t NumInputEpsilons(StateId s) const { return s == 0 ? 0 : fst_->NumInputEpsilons(s - 1); }
size_t NumOutputEpsilons(StateId s) const { return s == 0 ? 0 : fst_->NumOutputEpsilons(s - 1); }
uint64_t Properties() const override { return Properties(kFstProperties); }
// Sets error if found, and returns other FST impl properties.
uint64_t Properties(uint64_t mask) const override { if ((mask & kError) && fst_->Properties(kError, false)) { SetProperties(kError, kError); } return FstImpl<Arc>::Properties(mask); }
private: std::unique_ptr<const Fst<Arc>> fst_; };
} // namespace internal
// Complements an automaton. This is a library-internal operation that
// introduces a (negative) ρ-label; use Difference/DifferenceFst in user code,
// which will not see this label. This version is a delayed FST.
//
// This class attaches interface to implementation and handles
// reference counting, delegating most methods to ImplToFst.
template <class A> class ComplementFst : public ImplToFst<internal::ComplementFstImpl<A>> { public: using Arc = A; using Label = typename Arc::Label; using StateId = typename Arc::StateId; using Impl = internal::ComplementFstImpl<Arc>;
friend class StateIterator<ComplementFst<Arc>>; friend class ArcIterator<ComplementFst<Arc>>;
explicit ComplementFst(const Fst<Arc> &fst) : ImplToFst<Impl>(std::make_shared<Impl>(fst)) { static constexpr auto props = kUnweighted | kNoEpsilons | kIDeterministic | kAcceptor; if (fst.Properties(props, true) != props) { FSTERROR() << "ComplementFst: Argument not an unweighted " << "epsilon-free deterministic acceptor"; GetImpl()->SetProperties(kError, kError); } }
// See Fst<>::Copy() for doc.
ComplementFst(const ComplementFst &fst, bool safe = false) : ImplToFst<Impl>(fst, safe) {}
// Gets a copy of this FST. See Fst<>::Copy() for further doc.
ComplementFst *Copy(bool safe = false) const override { return new ComplementFst(*this, safe); }
inline void InitStateIterator(StateIteratorData<Arc> *data) const override;
inline void InitArcIterator(StateId s, ArcIteratorData<Arc> *data) const override;
// Label that represents the ρ-transition; we use a negative value private to
// the library and which will preserve FST label sort order.
static constexpr Label kRhoLabel = -2;
private: using ImplToFst<Impl>::GetImpl;
ComplementFst &operator=(const ComplementFst &) = delete; };
// Specialization for ComplementFst.
template <class Arc> class StateIterator<ComplementFst<Arc>> : public StateIteratorBase<Arc> { public: using StateId = typename Arc::StateId;
explicit StateIterator(const ComplementFst<Arc> &fst) : siter_(*fst.GetImpl()->fst_), s_(0) {}
bool Done() const final { return s_ > 0 && siter_.Done(); }
StateId Value() const final { return s_; }
void Next() final { if (s_ != 0) siter_.Next(); ++s_; }
void Reset() final { siter_.Reset(); s_ = 0; }
private: StateIterator<Fst<Arc>> siter_; StateId s_; };
// Specialization for ComplementFst.
template <class Arc> class ArcIterator<ComplementFst<Arc>> : public ArcIteratorBase<Arc> { public: using StateId = typename Arc::StateId; using Weight = typename Arc::Weight;
ArcIterator(const ComplementFst<Arc> &fst, StateId s) : s_(s), pos_(0) { if (s_ != 0) { aiter_ = std::make_unique<ArcIterator<Fst<Arc>>>(*fst.GetImpl()->fst_, s - 1); } }
bool Done() const final { if (s_ != 0) { return pos_ > 0 && aiter_->Done(); } else { return pos_ > 0; } }
// Adds the ρ-label to the ρ destination state.
const Arc &Value() const final { if (pos_ == 0) { arc_.ilabel = arc_.olabel = ComplementFst<Arc>::kRhoLabel; arc_.weight = Weight::One(); arc_.nextstate = 0; } else { arc_ = aiter_->Value(); ++arc_.nextstate; } return arc_; }
void Next() final { if (s_ != 0 && pos_ > 0) aiter_->Next(); ++pos_; }
size_t Position() const final { return pos_; }
void Reset() final { if (s_ != 0) aiter_->Reset(); pos_ = 0; }
void Seek(size_t a) final { if (s_ != 0) { if (a == 0) { aiter_->Reset(); } else { aiter_->Seek(a - 1); } } pos_ = a; }
uint8_t Flags() const final { return kArcValueFlags; }
void SetFlags(uint8_t, uint8_t) final {}
private: std::unique_ptr<ArcIterator<Fst<Arc>>> aiter_; StateId s_; size_t pos_; mutable Arc arc_; };
template <class Arc> inline void ComplementFst<Arc>::InitStateIterator( StateIteratorData<Arc> *data) const { data->base = std::make_unique<StateIterator<ComplementFst<Arc>>>(*this); }
template <class Arc> inline void ComplementFst<Arc>::InitArcIterator( StateId s, ArcIteratorData<Arc> *data) const { data->base = std::make_unique<ArcIterator<ComplementFst<Arc>>>(*this, s); }
// Useful alias when using StdArc.
using StdComplementFst = ComplementFst<StdArc>;
} // namespace fst
#endif // FST_COMPLEMENT_H_
|