|
// Copyright 2005-2024 Google LLC
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the 'License');
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an 'AS IS' BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
// See www.openfst.org for extensive documentation on this weighted
|
|
// finite-state transducer library.
|
|
//
|
|
// Functions and classes to sort arcs in an FST.
|
|
|
|
#ifndef FST_ARCSORT_H_
|
|
#define FST_ARCSORT_H_
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <algorithm>
|
|
#include <cstddef>
|
|
#include <cstdint>
|
|
#include <string>
|
|
#include <tuple>
|
|
#include <vector>
|
|
|
|
#include <fst/arc-map.h>
|
|
#include <fst/arc.h>
|
|
#include <fst/cache.h>
|
|
#include <fst/fst.h>
|
|
#include <fst/mutable-fst.h>
|
|
#include <fst/properties.h>
|
|
#include <fst/state-map.h>
|
|
|
|
namespace fst {
|
|
|
|
template <class Arc, class Compare>
|
|
class ArcSortMapper {
|
|
public:
|
|
using FromArc = Arc;
|
|
using ToArc = Arc;
|
|
|
|
using StateId = typename Arc::StateId;
|
|
using Weight = typename Arc::Weight;
|
|
|
|
constexpr ArcSortMapper(const Fst<Arc> &fst, const Compare &comp)
|
|
: fst_(fst), comp_(comp), i_(0) {}
|
|
|
|
// Allows updating Fst argument; pass only if changed.
|
|
ArcSortMapper(const ArcSortMapper<Arc, Compare> &mapper,
|
|
const Fst<Arc> *fst = nullptr)
|
|
: fst_(fst ? *fst : mapper.fst_), comp_(mapper.comp_), i_(0) {}
|
|
|
|
StateId Start() { return fst_.Start(); }
|
|
|
|
Weight Final(StateId s) const { return fst_.Final(s); }
|
|
|
|
void SetState(StateId s) {
|
|
i_ = 0;
|
|
arcs_.clear();
|
|
arcs_.reserve(fst_.NumArcs(s));
|
|
for (ArcIterator<Fst<Arc>> aiter(fst_, s); !aiter.Done(); aiter.Next()) {
|
|
arcs_.push_back(aiter.Value());
|
|
}
|
|
std::stable_sort(arcs_.begin(), arcs_.end(), comp_);
|
|
}
|
|
|
|
bool Done() const { return i_ >= arcs_.size(); }
|
|
|
|
const Arc &Value() const { return arcs_[i_]; }
|
|
|
|
void Next() { ++i_; }
|
|
|
|
MapSymbolsAction InputSymbolsAction() const { return MAP_COPY_SYMBOLS; }
|
|
|
|
MapSymbolsAction OutputSymbolsAction() const { return MAP_COPY_SYMBOLS; }
|
|
|
|
uint64_t Properties(uint64_t props) const { return comp_.Properties(props); }
|
|
|
|
private:
|
|
const Fst<Arc> &fst_;
|
|
const Compare &comp_;
|
|
std::vector<Arc> arcs_;
|
|
ssize_t i_; // current arc position
|
|
|
|
ArcSortMapper &operator=(const ArcSortMapper &) = delete;
|
|
};
|
|
|
|
// Sorts the arcs in an FST according to function object 'comp' of type Compare.
|
|
// This version modifies its input. Comparison function objects ILabelCompare
|
|
// and OLabelCompare are provided by the library. In general, Compare must meet
|
|
// the requirements for a comparison function object (e.g., similar to those
|
|
// used by std::sort). It must also have a member Properties(uint64_t) that
|
|
// specifies the known properties of the sorted FST; it takes as argument the
|
|
// input FST's known properties before the sort.
|
|
//
|
|
// Complexity:
|
|
//
|
|
// - Time: O(v d log d)
|
|
// - Space: O(d)
|
|
//
|
|
// where v = # of states and d = maximum out-degree.
|
|
template <class Arc, class Compare>
|
|
void ArcSort(MutableFst<Arc> *fst, Compare comp) {
|
|
ArcSortMapper<Arc, Compare> mapper(*fst, comp);
|
|
StateMap(fst, mapper);
|
|
}
|
|
|
|
using ArcSortFstOptions = CacheOptions;
|
|
|
|
// Sorts the arcs in an FST according to function object 'comp' of type Compare.
|
|
// This version is a delayed FST. Comparsion function objects ILabelCompare and
|
|
// OLabelCompare are provided by the library. In general, Compare must meet the
|
|
// requirements for a comparision function object (e.g., similar to those
|
|
// used by std::sort). It must also have a member Properties(uint64_t) that
|
|
// specifies the known properties of the sorted FST; it takes as argument the
|
|
// input FST's known properties.
|
|
//
|
|
// Complexity:
|
|
//
|
|
// - Time: O(v d log d)
|
|
// - Space: O(d)
|
|
//
|
|
// where v = # of states visited, d = maximum out-degree of states visited.
|
|
// Constant time and space to visit an input state is assumed and exclusive of
|
|
// caching.
|
|
template <class Arc, class Compare>
|
|
class ArcSortFst : public StateMapFst<Arc, Arc, ArcSortMapper<Arc, Compare>> {
|
|
using StateMapFst<Arc, Arc, ArcSortMapper<Arc, Compare>>::GetImpl;
|
|
|
|
public:
|
|
using StateId = typename Arc::StateId;
|
|
using Mapper = ArcSortMapper<Arc, Compare>;
|
|
|
|
ArcSortFst(const Fst<Arc> &fst, const Compare &comp)
|
|
: StateMapFst<Arc, Arc, Mapper>(fst,
|
|
ArcSortMapper<Arc, Compare>(fst, comp)) {}
|
|
|
|
ArcSortFst(const Fst<Arc> &fst, const Compare &comp,
|
|
const ArcSortFstOptions &opts)
|
|
: StateMapFst<Arc, Arc, Mapper>(fst, Mapper(fst, comp), opts) {}
|
|
|
|
// See Fst<>::Copy() for doc.
|
|
ArcSortFst(const ArcSortFst &fst, bool safe = false)
|
|
: StateMapFst<Arc, Arc, Mapper>(fst, safe) {}
|
|
|
|
// Gets a copy of this ArcSortFst. See Fst<>::Copy() for further doc.
|
|
ArcSortFst *Copy(bool safe = false) const override {
|
|
return new ArcSortFst(*this, safe);
|
|
}
|
|
|
|
size_t NumArcs(StateId s) const override {
|
|
return GetImpl()->GetFst()->NumArcs(s);
|
|
}
|
|
|
|
size_t NumInputEpsilons(StateId s) const override {
|
|
return GetImpl()->GetFst()->NumInputEpsilons(s);
|
|
}
|
|
|
|
size_t NumOutputEpsilons(StateId s) const override {
|
|
return GetImpl()->GetFst()->NumOutputEpsilons(s);
|
|
}
|
|
};
|
|
|
|
// Specialization for ArcSortFst.
|
|
template <class Arc, class Compare>
|
|
class StateIterator<ArcSortFst<Arc, Compare>>
|
|
: public StateIterator<StateMapFst<Arc, Arc, ArcSortMapper<Arc, Compare>>> {
|
|
public:
|
|
explicit StateIterator(const ArcSortFst<Arc, Compare> &fst)
|
|
: StateIterator<StateMapFst<Arc, Arc, ArcSortMapper<Arc, Compare>>>(fst) {
|
|
}
|
|
};
|
|
|
|
// Specialization for ArcSortFst.
|
|
template <class Arc, class Compare>
|
|
class ArcIterator<ArcSortFst<Arc, Compare>>
|
|
: public ArcIterator<StateMapFst<Arc, Arc, ArcSortMapper<Arc, Compare>>> {
|
|
public:
|
|
ArcIterator(const ArcSortFst<Arc, Compare> &fst, typename Arc::StateId s)
|
|
: ArcIterator<StateMapFst<Arc, Arc, ArcSortMapper<Arc, Compare>>>(fst,
|
|
s) {}
|
|
};
|
|
|
|
// Compare class for comparing input labels of arcs.
|
|
template <class Arc>
|
|
class ILabelCompare {
|
|
public:
|
|
constexpr ILabelCompare() = default;
|
|
|
|
constexpr bool operator()(const Arc &lhs, const Arc &rhs) const {
|
|
return std::forward_as_tuple(lhs.ilabel, lhs.olabel) <
|
|
std::forward_as_tuple(rhs.ilabel, rhs.olabel);
|
|
}
|
|
|
|
constexpr uint64_t Properties(uint64_t props) const {
|
|
return (props & kArcSortProperties) | kILabelSorted |
|
|
(props & kAcceptor ? kOLabelSorted : 0);
|
|
}
|
|
};
|
|
|
|
// Compare class for comparing output labels of arcs.
|
|
template <class Arc>
|
|
class OLabelCompare {
|
|
public:
|
|
constexpr OLabelCompare() = default;
|
|
|
|
constexpr bool operator()(const Arc &lhs, const Arc &rhs) const {
|
|
return std::forward_as_tuple(lhs.olabel, lhs.ilabel) <
|
|
std::forward_as_tuple(rhs.olabel, rhs.ilabel);
|
|
}
|
|
|
|
constexpr uint64_t Properties(uint64_t props) const {
|
|
return (props & kArcSortProperties) | kOLabelSorted |
|
|
(props & kAcceptor ? kILabelSorted : 0);
|
|
}
|
|
};
|
|
|
|
// Useful aliases when using StdArc.
|
|
|
|
template <class Compare>
|
|
using StdArcSortFst = ArcSortFst<StdArc, Compare>;
|
|
|
|
using StdILabelCompare = ILabelCompare<StdArc>;
|
|
|
|
using StdOLabelCompare = OLabelCompare<StdArc>;
|
|
|
|
} // namespace fst
|
|
|
|
#endif // FST_ARCSORT_H_
|