// decoder/lattice-incremental-online-decoder.h // Copyright 2019 Zhehuai Chen // // See ../../COPYING for clarification regarding multiple authors // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE, // MERCHANTABLITY OR NON-INFRINGEMENT. // See the Apache 2 License for the specific language governing permissions and // limitations under the License. // see note at the top of lattice-faster-decoder.h, about how to maintain this // file in sync with lattice-faster-decoder.h #ifndef KALDI_DECODER_LATTICE_INCREMENTAL_ONLINE_DECODER_H_ #define KALDI_DECODER_LATTICE_INCREMENTAL_ONLINE_DECODER_H_ #include "util/stl-utils.h" #include "util/hash-list.h" #include "fst/fstlib.h" #include "itf/decodable-itf.h" #include "fstext/fstext-lib.h" #include "lat/determinize-lattice-pruned.h" #include "lat/kaldi-lattice.h" #include "decoder/lattice-incremental-decoder.h" namespace kaldi { /** LatticeIncrementalOnlineDecoderTpl is as LatticeIncrementalDecoderTpl but also supports an efficient way to get the best path (see the function BestPathEnd()), which is useful in endpointing and in situations where you might want to frequently access the best path. This is only templated on the FST type, since the Token type is required to be BackpointerToken. Actually it only makes sense to instantiate LatticeIncrementalDecoderTpl with Token == BackpointerToken if you do so indirectly via this child class. */ template class LatticeIncrementalOnlineDecoderTpl: public LatticeIncrementalDecoderTpl { public: using Arc = typename FST::Arc; using Label = typename Arc::Label; using StateId = typename Arc::StateId; using Weight = typename Arc::Weight; using Token = decoder::BackpointerToken; using ForwardLinkT = decoder::ForwardLink; // Instantiate this class once for each thing you have to decode. // This version of the constructor does not take ownership of // 'fst'. LatticeIncrementalOnlineDecoderTpl(const FST &fst, const TransitionInformation &trans_model, const LatticeIncrementalDecoderConfig &config): LatticeIncrementalDecoderTpl(fst, trans_model, config) { } // This version of the initializer takes ownership of 'fst', and will delete // it when this object is destroyed. LatticeIncrementalOnlineDecoderTpl(const LatticeIncrementalDecoderConfig &config, FST *fst, const TransitionInformation &trans_model): LatticeIncrementalDecoderTpl(config, fst, trans_model) { } struct BestPathIterator { void *tok; int32 frame; // note, "frame" is the frame-index of the frame you'll get the // transition-id for next time, if you call TraceBackBestPath on this // iterator (assuming it's not an epsilon transition). Note that this // is one less than you might reasonably expect, e.g. it's -1 for // the nonemitting transitions before the first frame. BestPathIterator(void *t, int32 f): tok(t), frame(f) { } bool Done() { return tok == NULL; } }; /// Outputs an FST corresponding to the single best path through the lattice. /// This is quite efficient because it doesn't get the entire raw lattice and find /// the best path through it; instead, it uses the BestPathEnd and BestPathIterator /// so it basically traces it back through the lattice. /// Returns true if result is nonempty (using the return status is deprecated, /// it will become void). If "use_final_probs" is true AND we reached the /// final-state of the graph then it will include those as final-probs, else /// it will treat all final-probs as one. bool GetBestPath(Lattice *ofst, bool use_final_probs = true) const; /// This function returns an iterator that can be used to trace back /// the best path. If use_final_probs == true and at least one final state /// survived till the end, it will use the final-probs in working out the best /// final Token, and will output the final cost to *final_cost (if non-NULL), /// else it will use only the forward likelihood, and will put zero in /// *final_cost (if non-NULL). /// Requires that NumFramesDecoded() > 0. BestPathIterator BestPathEnd(bool use_final_probs, BaseFloat *final_cost = NULL) const; /// This function can be used in conjunction with BestPathEnd() to trace back /// the best path one link at a time (e.g. this can be useful in endpoint /// detection). By "link" we mean a link in the graph; not all links cross /// frame boundaries, but each time you see a nonzero ilabel you can interpret /// that as a frame. The return value is the updated iterator. It outputs /// the ilabel and olabel, and the (graph and acoustic) weight to the "arc" pointer, /// while leaving its "nextstate" variable unchanged. BestPathIterator TraceBackBestPath( BestPathIterator iter, LatticeArc *arc) const; KALDI_DISALLOW_COPY_AND_ASSIGN(LatticeIncrementalOnlineDecoderTpl); }; typedef LatticeIncrementalOnlineDecoderTpl LatticeIncrementalOnlineDecoder; } // end namespace kaldi. #endif