|
|
// Copyright 2005-2024 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the 'License');
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an 'AS IS' BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// See www.openfst.org for extensive documentation on this weighted
// finite-state transducer library.
//
// Lexicographic weight set and associated semiring operation definitions.
//
// A lexicographic weight is a sequence of weights, each of which must have the
// path property and Times() must be (strongly) cancellative
// (for all a,b,c != Zero(): Times(c, a) = Times(c, b) => a = b,
// Times(a, c) = Times(b, c) => a = b).
// The + operation on two weights a and b is the lexicographically
// prior of a and b.
#ifndef FST_LEXICOGRAPHIC_WEIGHT_H_
#define FST_LEXICOGRAPHIC_WEIGHT_H_
#include <cstddef>
#include <cstdint>
#include <random>
#include <string>
#include <fst/log.h>
#include <fst/pair-weight.h>
#include <fst/weight.h>
namespace fst {
template <class W1, class W2> class LexicographicWeight : public PairWeight<W1, W2> { public: static_assert(IsPath<W1>::value, "W1 must have path property."); static_assert(IsPath<W2>::value, "W2 must have path property.");
using ReverseWeight = LexicographicWeight<typename W1::ReverseWeight, typename W2::ReverseWeight>;
using PairWeight<W1, W2>::Value1; using PairWeight<W1, W2>::Value2; using PairWeight<W1, W2>::SetValue1; using PairWeight<W1, W2>::SetValue2; using PairWeight<W1, W2>::Zero; using PairWeight<W1, W2>::One; using PairWeight<W1, W2>::NoWeight; using PairWeight<W1, W2>::Quantize; using PairWeight<W1, W2>::Reverse;
LexicographicWeight() = default;
explicit LexicographicWeight(const PairWeight<W1, W2> &w) : PairWeight<W1, W2>(w) {}
LexicographicWeight(W1 w1, W2 w2) : PairWeight<W1, W2>(w1, w2) {}
static const LexicographicWeight &Zero() { static const LexicographicWeight zero(PairWeight<W1, W2>::Zero()); return zero; }
static const LexicographicWeight &One() { static const LexicographicWeight one(PairWeight<W1, W2>::One()); return one; }
static const LexicographicWeight &NoWeight() { static const LexicographicWeight no_weight(PairWeight<W1, W2>::NoWeight()); return no_weight; }
static const std::string &Type() { static const std::string *const type = new std::string(W1::Type() + "_LT_" + W2::Type()); return *type; }
bool Member() const { if (!Value1().Member() || !Value2().Member()) return false; // Lexicographic weights cannot mix zeroes and non-zeroes.
if (Value1() == W1::Zero() && Value2() == W2::Zero()) return true; if (Value1() != W1::Zero() && Value2() != W2::Zero()) return true; return false; }
LexicographicWeight Quantize(float delta = kDelta) const { return LexicographicWeight(PairWeight<W1, W2>::Quantize()); }
ReverseWeight Reverse() const { return ReverseWeight(PairWeight<W1, W2>::Reverse()); }
static constexpr uint64_t Properties() { return W1::Properties() & W2::Properties() & (kLeftSemiring | kRightSemiring | kPath | kIdempotent | kCommutative); } };
template <class W1, class W2> inline LexicographicWeight<W1, W2> Plus(const LexicographicWeight<W1, W2> &w, const LexicographicWeight<W1, W2> &v) { if (!w.Member() || !v.Member()) { return LexicographicWeight<W1, W2>::NoWeight(); } NaturalLess<W1> less1; NaturalLess<W2> less2; if (less1(w.Value1(), v.Value1())) return w; if (less1(v.Value1(), w.Value1())) return v; if (less2(w.Value2(), v.Value2())) return w; if (less2(v.Value2(), w.Value2())) return v; return w; }
template <class W1, class W2> inline LexicographicWeight<W1, W2> Times(const LexicographicWeight<W1, W2> &w, const LexicographicWeight<W1, W2> &v) { return LexicographicWeight<W1, W2>(Times(w.Value1(), v.Value1()), Times(w.Value2(), v.Value2())); }
template <class W1, class W2> inline LexicographicWeight<W1, W2> Divide(const LexicographicWeight<W1, W2> &w, const LexicographicWeight<W1, W2> &v, DivideType typ = DIVIDE_ANY) { return LexicographicWeight<W1, W2>(Divide(w.Value1(), v.Value1(), typ), Divide(w.Value2(), v.Value2(), typ)); }
// This function object generates weights by calling the underlying generators
// for the templated weight types, like all other pair weight types. However,
// for lexicographic weights, we cannot generate zeroes for the two subweights
// separately: weights are members iff both members are zero or both members
// are non-zero. This is intended primarily for testing.
template <class W1, class W2> class WeightGenerate<LexicographicWeight<W1, W2>> { public: using Weight = LexicographicWeight<W1, W1>; using Generate1 = WeightGenerate<W1>; using Generate2 = WeightGenerate<W2>;
explicit WeightGenerate(uint64_t seed = std::random_device()(), bool allow_zero = true, size_t num_random_weights = kNumRandomWeights) : rand_(seed), allow_zero_(allow_zero), num_random_weights_(num_random_weights), generator1_(seed, false, num_random_weights), generator2_(seed, false, num_random_weights) {}
Weight operator()() const { if (allow_zero_) { const int sample = std::uniform_int_distribution<>(0, num_random_weights_)(rand_); if (sample == num_random_weights_) return Weight(W1::Zero(), W2::Zero()); } return Weight(generator1_(), generator2_()); }
private: mutable std::mt19937_64 rand_; const bool allow_zero_; const size_t num_random_weights_; const Generate1 generator1_; const Generate2 generator2_; };
} // namespace fst
#endif // FST_LEXICOGRAPHIC_WEIGHT_H_
|