// See www.openfst.org for extensive documentation on this weighted
|
// finite-state transducer library.
|
|
#ifndef FST_EXTENSIONS_SPECIAL_SIGMA_FST_H_
|
#define FST_EXTENSIONS_SPECIAL_SIGMA_FST_H_
|
|
#include <memory>
|
#include <string>
|
|
#include <fst/const-fst.h>
|
#include <fst/matcher-fst.h>
|
#include <fst/matcher.h>
|
|
DECLARE_int64(sigma_fst_sigma_label);
|
DECLARE_string(sigma_fst_rewrite_mode);
|
|
namespace fst {
|
namespace internal {
|
|
template <class Label>
|
class SigmaFstMatcherData {
|
public:
|
explicit SigmaFstMatcherData(Label sigma_label = FLAGS_sigma_fst_sigma_label,
|
MatcherRewriteMode rewrite_mode =
|
RewriteMode(FLAGS_sigma_fst_rewrite_mode))
|
: sigma_label_(sigma_label), rewrite_mode_(rewrite_mode) {}
|
|
SigmaFstMatcherData(const SigmaFstMatcherData &data)
|
: sigma_label_(data.sigma_label_), rewrite_mode_(data.rewrite_mode_) {}
|
|
static SigmaFstMatcherData<Label> *Read(std::istream &istrm,
|
const FstReadOptions &read) {
|
auto *data = new SigmaFstMatcherData<Label>();
|
ReadType(istrm, &data->sigma_label_);
|
int32 rewrite_mode;
|
ReadType(istrm, &rewrite_mode);
|
data->rewrite_mode_ = static_cast<MatcherRewriteMode>(rewrite_mode);
|
return data;
|
}
|
|
bool Write(std::ostream &ostrm, const FstWriteOptions &opts) const {
|
WriteType(ostrm, sigma_label_);
|
WriteType(ostrm, static_cast<int32>(rewrite_mode_));
|
return !ostrm ? false : true;
|
}
|
|
Label SigmaLabel() const { return sigma_label_; }
|
|
MatcherRewriteMode RewriteMode() const { return rewrite_mode_; }
|
|
private:
|
static MatcherRewriteMode RewriteMode(const string &mode) {
|
if (mode == "auto") return MATCHER_REWRITE_AUTO;
|
if (mode == "always") return MATCHER_REWRITE_ALWAYS;
|
if (mode == "never") return MATCHER_REWRITE_NEVER;
|
LOG(WARNING) << "SigmaFst: Unknown rewrite mode: " << mode << ". "
|
<< "Defaulting to auto.";
|
return MATCHER_REWRITE_AUTO;
|
}
|
|
Label sigma_label_;
|
MatcherRewriteMode rewrite_mode_;
|
};
|
|
} // namespace internal
|
|
// Bit flags for the `flags` template argument of SigmaFstMatcher; they select
// the match side(s) on which the sigma label is applied.
constexpr uint8 kSigmaFstMatchInput = 1 << 0;   // Input matcher is SigmaMatcher.
constexpr uint8 kSigmaFstMatchOutput = 1 << 1;  // Output matcher is SigmaMatcher.
|
|
template <class M, uint8 flags = kSigmaFstMatchInput | kSigmaFstMatchOutput>
|
class SigmaFstMatcher : public SigmaMatcher<M> {
|
public:
|
using FST = typename M::FST;
|
using Arc = typename M::Arc;
|
using StateId = typename Arc::StateId;
|
using Label = typename Arc::Label;
|
using Weight = typename Arc::Weight;
|
using MatcherData = internal::SigmaFstMatcherData<Label>;
|
|
enum : uint8 { kFlags = flags };
|
|
// This makes a copy of the FST.
|
SigmaFstMatcher(
|
const FST &fst, MatchType match_type,
|
std::shared_ptr<MatcherData> data = std::make_shared<MatcherData>())
|
: SigmaMatcher<M>(
|
fst, match_type,
|
SigmaLabel(match_type,
|
data ? data->SigmaLabel() : MatcherData().SigmaLabel()),
|
data ? data->RewriteMode() : MatcherData().RewriteMode()),
|
data_(data) {}
|
|
// This doesn't copy the FST.
|
SigmaFstMatcher(
|
const FST *fst, MatchType match_type,
|
std::shared_ptr<MatcherData> data = std::make_shared<MatcherData>())
|
: SigmaMatcher<M>(
|
fst, match_type,
|
SigmaLabel(match_type,
|
data ? data->SigmaLabel() : MatcherData().SigmaLabel()),
|
data ? data->RewriteMode() : MatcherData().RewriteMode()),
|
data_(data) {}
|
|
// This makes a copy of the FST.
|
SigmaFstMatcher(const SigmaFstMatcher<M, flags> &matcher, bool safe = false)
|
: SigmaMatcher<M>(matcher, safe), data_(matcher.data_) {}
|
|
SigmaFstMatcher<M, flags> *Copy(bool safe = false) const override {
|
return new SigmaFstMatcher<M, flags>(*this, safe);
|
}
|
|
const MatcherData *GetData() const { return data_.get(); }
|
|
std::shared_ptr<MatcherData> GetSharedData() const { return data_; }
|
|
private:
|
static Label SigmaLabel(MatchType match_type, Label label) {
|
if (match_type == MATCH_INPUT && flags & kSigmaFstMatchInput) return label;
|
if (match_type == MATCH_OUTPUT && flags & kSigmaFstMatchOutput)
|
return label;
|
return kNoLabel;
|
}
|
|
std::shared_ptr<MatcherData> data_;
|
};
|
|
// FST type-name strings used as the name template argument of the MatcherFst
// aliases in this header. They are only declared here; the definitions live
// in another translation unit.
extern const char sigma_fst_type[];
extern const char input_sigma_fst_type[];
extern const char output_sigma_fst_type[];
|
|
using StdSigmaFst = MatcherFst<ConstFst<StdArc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<StdArc>>>,
|
sigma_fst_type>;
|
|
using LogSigmaFst = MatcherFst<ConstFst<LogArc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<LogArc>>>,
|
sigma_fst_type>;
|
|
using Log64SigmaFst =
|
MatcherFst<ConstFst<Log64Arc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<Log64Arc>>>,
|
input_sigma_fst_type>;
|
|
using StdInputSigmaFst = MatcherFst<
|
ConstFst<StdArc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<StdArc>>, kSigmaFstMatchInput>,
|
input_sigma_fst_type>;
|
|
using LogInputSigmaFst = MatcherFst<
|
ConstFst<LogArc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<LogArc>>, kSigmaFstMatchInput>,
|
input_sigma_fst_type>;
|
|
using Log64InputSigmaFst = MatcherFst<
|
ConstFst<Log64Arc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<Log64Arc>>, kSigmaFstMatchInput>,
|
input_sigma_fst_type>;
|
|
using StdOutputSigmaFst = MatcherFst<
|
ConstFst<StdArc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<StdArc>>, kSigmaFstMatchOutput>,
|
output_sigma_fst_type>;
|
|
using LogOutputSigmaFst = MatcherFst<
|
ConstFst<LogArc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<LogArc>>, kSigmaFstMatchOutput>,
|
output_sigma_fst_type>;
|
|
using Log64OutputSigmaFst = MatcherFst<
|
ConstFst<Log64Arc>,
|
SigmaFstMatcher<SortedMatcher<ConstFst<Log64Arc>>, kSigmaFstMatchOutput>,
|
output_sigma_fst_type>;
|
|
} // namespace fst
|
|
#endif // FST_EXTENSIONS_SPECIAL_SIGMA_FST_H_
|