You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 

213 lines
6.3 KiB

// Copyright 2005-2024 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the 'License');
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an 'AS IS' BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// See www.openfst.org for extensive documentation on this weighted
// finite-state transducer library.
//
// Generic FST augmented with state count-interface class definition.
#ifndef FST_EXPANDED_FST_H_
#define FST_EXPANDED_FST_H_
#include <sys/types.h>
#include <cstddef>
#include <ios>
#include <iostream>
#include <istream>
#include <memory>
#include <optional>
#include <string>
#include <vector>
#include <fst/log.h>
#include <fst/arc.h>
#include <fstream>
#include <fst/fst.h>
#include <fst/impl-to-fst.h>
#include <fst/properties.h>
#include <fst/register.h>
namespace fst {
// A generic FST plus state count.
template <class A>
class ExpandedFst : public Fst<A> {
public:
using Arc = A;
using StateId = typename Arc::StateId;
virtual StateId NumStates() const = 0; // State count
std::optional<StateId> NumStatesIfKnown() const override {
return NumStates();
}
// Get a copy of this ExpandedFst. See Fst<>::Copy() for further doc.
ExpandedFst *Copy(bool safe = false) const override = 0;
// Read an ExpandedFst from an input stream; return NULL on error.
static ExpandedFst *Read(std::istream &strm, const FstReadOptions &opts) {
FstReadOptions ropts(opts);
FstHeader hdr;
if (ropts.header) {
hdr = *opts.header;
} else {
if (!hdr.Read(strm, opts.source)) return nullptr;
ropts.header = &hdr;
}
if (!(hdr.Properties() & kExpanded)) {
LOG(ERROR) << "ExpandedFst::Read: Not an ExpandedFst: " << ropts.source;
return nullptr;
}
const auto reader =
FstRegister<Arc>::GetRegister()->GetReader(hdr.FstType());
if (!reader) {
LOG(ERROR) << "ExpandedFst::Read: Unknown FST type \"" << hdr.FstType()
<< "\" (arc type = \"" << A::Type() << "\"): " << ropts.source;
return nullptr;
}
auto *fst = reader(strm, ropts);
if (!fst) return nullptr;
return down_cast<ExpandedFst *>(fst);
}
// Read an ExpandedFst from a file; return NULL on error.
// Empty source reads from standard input.
static ExpandedFst *Read(std::string_view source) {
if (!source.empty()) {
std::ifstream strm(std::string(source),
std::ios_base::in | std::ios_base::binary);
if (!strm) {
LOG(ERROR) << "ExpandedFst::Read: Can't open file: " << source;
return nullptr;
}
return Read(strm, FstReadOptions(source));
} else {
return Read(std::cin, FstReadOptions("standard input"));
}
}
};
namespace internal {
// ExpandedFst<A> case - abstract methods.
template <class Arc>
inline typename Arc::Weight Final(const ExpandedFst<Arc> &fst,
typename Arc::StateId s) {
return fst.Final(s);
}
template <class Arc>
inline ssize_t NumArcs(const ExpandedFst<Arc> &fst, typename Arc::StateId s) {
return fst.NumArcs(s);
}
template <class Arc>
inline ssize_t NumInputEpsilons(const ExpandedFst<Arc> &fst,
typename Arc::StateId s) {
return fst.NumInputEpsilons(s);
}
template <class Arc>
inline ssize_t NumOutputEpsilons(const ExpandedFst<Arc> &fst,
typename Arc::StateId s) {
return fst.NumOutputEpsilons(s);
}
} // namespace internal
// A useful alias when using StdArc.
using StdExpandedFst = ExpandedFst<StdArc>;
// This is a helper class template useful for attaching an ExpandedFst
// interface to its implementation, handling reference counting. It
// delegates to ImplToFst the handling of the Fst interface methods.
template <class Impl, class FST = ExpandedFst<typename Impl::Arc>>
class ImplToExpandedFst : public ImplToFst<Impl, FST> {
public:
using Arc = typename FST::Arc;
using StateId = typename Arc::StateId;
using Weight = typename Arc::Weight;
StateId NumStates() const override { return GetImpl()->NumStates(); }
protected:
using ImplToFst<Impl, FST>::GetImpl;
explicit ImplToExpandedFst(std::shared_ptr<Impl> impl)
: ImplToFst<Impl, FST>(impl) {}
ImplToExpandedFst(const ImplToExpandedFst &fst, bool safe)
: ImplToFst<Impl, FST>(fst, safe) {}
static Impl *Read(std::istream &strm, const FstReadOptions &opts) {
return Impl::Read(strm, opts);
}
// Read FST implementation from a file; return NULL on error.
// Empty source reads from standard input.
static Impl *Read(std::string_view source) {
if (!source.empty()) {
std::ifstream strm(std::string(source),
std::ios_base::in | std::ios_base::binary);
if (!strm) {
LOG(ERROR) << "ExpandedFst::Read: Can't open file: " << source;
return nullptr;
}
return Impl::Read(strm, FstReadOptions(source));
} else {
return Impl::Read(std::cin, FstReadOptions("standard input"));
}
}
};
// Function to return the number of states in an FST, counting them
// if necessary.
template <class Arc>
typename Arc::StateId CountStates(const Fst<Arc> &fst) {
if (std::optional<typename Arc::StateId> num_states =
fst.NumStatesIfKnown()) {
return *num_states;
} else {
typename Arc::StateId nstates = 0;
for (StateIterator<Fst<Arc>> siter(fst); !siter.Done(); siter.Next()) {
++nstates;
}
return nstates;
}
}
// Function to return the number of states in a vector of FSTs, counting them if
// necessary.
template <class Arc>
typename Arc::StateId CountStates(const std::vector<const Fst<Arc> *> &fsts) {
typename Arc::StateId nstates = 0;
for (const auto *fst : fsts) nstates += CountStates(*fst);
return nstates;
}
// Function to return the number of arcs in an FST.
template <class F>
size_t CountArcs(const F &fst) {
size_t narcs = 0;
for (StateIterator<F> siter(fst); !siter.Done(); siter.Next()) {
narcs += fst.NumArcs(siter.Value());
}
return narcs;
}
} // namespace fst
#endif // FST_EXPANDED_FST_H_